1 //=- AArch64SchedA57.td - ARM Cortex-A57 Scheduling Defs -----*- tablegen -*-=//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file defines the machine model for ARM Cortex-A57 to support
10 // instruction scheduling and other instruction cost heuristics.
12 //===----------------------------------------------------------------------===//
14 //===----------------------------------------------------------------------===//
15 // The Cortex-A57 is a traditional superscalar microprocessor with a
16 // conservative 3-wide in-order stage for decode and dispatch. Combined with the
17 // much wider out-of-order issue stage, this produced a need to carefully
18 // schedule micro-ops so that all three decoded each cycle are successfully
19 // issued as the reservation station(s) simply don't stay occupied for long.
20 // Therefore, IssueWidth is set to the narrower of the two at three, while still
21 // modeling the machine as out-of-order.
23 def CortexA57Model : SchedMachineModel {
24 let IssueWidth = 3; // 3-way decode and dispatch
25 let MicroOpBufferSize = 128; // 128 micro-op re-order buffer
26 let LoadLatency = 4; // Optimistic load latency
27 let MispredictPenalty = 14; // Fetch + Decode/Rename/Dispatch + Branch
29 // Enable partial & runtime unrolling. The magic number is chosen based on
30 // experiments and benchmarking data.
31 let LoopMicroOpBufferSize = 16;
32 let CompleteModel = 1;
34 list<Predicate> UnsupportedFeatures = !listconcat(SVEUnsupported.F,
39 //===----------------------------------------------------------------------===//
40 // Define each kind of processor resource and number available on Cortex-A57.
41 // Cortex A-57 has 8 pipelines that each has its own 8-entry queue where
42 // micro-ops wait for their operands and then issue out-of-order.
44 def A57UnitB : ProcResource<1>; // Type B micro-ops
45 def A57UnitI : ProcResource<2>; // Type I micro-ops
46 def A57UnitM : ProcResource<1>; // Type M micro-ops
47 def A57UnitL : ProcResource<1>; // Type L micro-ops
48 def A57UnitS : ProcResource<1>; // Type S micro-ops
49 def A57UnitX : ProcResource<1>; // Type X micro-ops
50 def A57UnitW : ProcResource<1>; // Type W micro-ops
51 let SchedModel = CortexA57Model in {
52 def A57UnitV : ProcResGroup<[A57UnitX, A57UnitW]>; // Type V micro-ops
55 let SchedModel = CortexA57Model in {
57 //===----------------------------------------------------------------------===//
58 // Define customized scheduler read/write types specific to the Cortex-A57.
60 include "AArch64SchedA57WriteRes.td"
62 //===----------------------------------------------------------------------===//
63 // Map the target-defined scheduler read/write resources and latency for
64 // Cortex-A57. The Cortex-A57 types are directly associated with resources, so
65 // defining the aliases precludes the need for mapping them using WriteRes. The
66 // aliases are sufficient for creating a coarse, working model. As the model
67 // evolves, InstRWs will be used to override some of these SchedAliases.
69 // WARNING: Using SchedAliases is convenient and works well for latency and
70 // resource lookup for instructions. However, this creates an entry in
71 // AArch64WriteLatencyTable with a WriteResourceID of 0, breaking
72 // any SchedReadAdvance since the lookup will fail.
74 def : SchedAlias<WriteImm, A57Write_1cyc_1I>;
75 def : SchedAlias<WriteI, A57Write_1cyc_1I>;
76 def : SchedAlias<WriteISReg, A57Write_2cyc_1M>;
77 def : SchedAlias<WriteIEReg, A57Write_2cyc_1M>;
78 def : SchedAlias<WriteExtr, A57Write_1cyc_1I>;
79 def : SchedAlias<WriteIS, A57Write_1cyc_1I>;
80 def : SchedAlias<WriteID32, A57Write_19cyc_1M>;
81 def : SchedAlias<WriteID64, A57Write_35cyc_1M>;
82 def : WriteRes<WriteIM32, [A57UnitM]> { let Latency = 3; }
83 def : WriteRes<WriteIM64, [A57UnitM]> { let Latency = 5; }
84 def : SchedAlias<WriteBr, A57Write_1cyc_1B>;
85 def : SchedAlias<WriteBrReg, A57Write_1cyc_1B>;
86 def : SchedAlias<WriteLD, A57Write_4cyc_1L>;
87 def : SchedAlias<WriteST, A57Write_1cyc_1S>;
88 def : SchedAlias<WriteSTP, A57Write_1cyc_1S>;
89 def : SchedAlias<WriteAdr, A57Write_1cyc_1I>;
90 def : SchedAlias<WriteLDIdx, A57Write_4cyc_1I_1L>;
91 def : SchedAlias<WriteSTIdx, A57Write_1cyc_1I_1S>;
92 def : SchedAlias<WriteF, A57Write_3cyc_1V>;
93 def : SchedAlias<WriteFCmp, A57Write_3cyc_1V>;
94 def : SchedAlias<WriteFCvt, A57Write_5cyc_1V>;
95 def : SchedAlias<WriteFCopy, A57Write_5cyc_1L>;
96 def : SchedAlias<WriteFImm, A57Write_3cyc_1V>;
97 def : WriteRes<WriteFMul, [A57UnitV]> { let Latency = 5;}
98 def : SchedAlias<WriteFDiv, A57Write_17cyc_1W>;
99 def : SchedAlias<WriteV, A57Write_3cyc_1V>;
100 def : SchedAlias<WriteVLD, A57Write_5cyc_1L>;
101 def : SchedAlias<WriteVST, A57Write_1cyc_1S>;
103 def : WriteRes<WriteAtomic, []> { let Unsupported = 1; }
105 def : WriteRes<WriteSys, []> { let Latency = 1; }
106 def : WriteRes<WriteBarrier, []> { let Latency = 1; }
107 def : WriteRes<WriteHint, []> { let Latency = 1; }
109 def : WriteRes<WriteLDHi, []> { let Latency = 4; }
111 // Forwarding logic is only modeled for multiply and accumulate
112 def : ReadAdvance<ReadI, 0>;
113 def : ReadAdvance<ReadISReg, 0>;
114 def : ReadAdvance<ReadIEReg, 0>;
115 def : ReadAdvance<ReadIM, 0>;
116 def : ReadAdvance<ReadIMA, 2, [WriteIM32, WriteIM64]>;
117 def : ReadAdvance<ReadID, 0>;
118 def : ReadAdvance<ReadExtrHi, 0>;
119 def : ReadAdvance<ReadAdrBase, 0>;
120 def : ReadAdvance<ReadVLD, 0>;
123 //===----------------------------------------------------------------------===//
124 // Specialize the coarse model by associating instruction groups with the
125 // subtarget-defined types. As the modeled is refined, this will override most
126 // of the above ShchedAlias mappings.
129 // -----------------------------------------------------------------------------
131 def : InstRW<[WriteI], (instrs COPY)>;
134 // Branch Instructions
135 // -----------------------------------------------------------------------------
137 def : InstRW<[A57Write_1cyc_1B_1I], (instrs BL)>;
138 def : InstRW<[A57Write_2cyc_1B_1I], (instrs BLR)>;
141 // Shifted Register with Shift == 0
142 // ----------------------------------------------------------------------------
144 def A57WriteISReg : SchedWriteVariant<[
145 SchedVar<RegShiftedPred, [WriteISReg]>,
146 SchedVar<NoSchedPred, [WriteI]>]>;
147 def : InstRW<[A57WriteISReg], (instregex ".*rs$")>;
150 // Divide and Multiply Instructions
151 // -----------------------------------------------------------------------------
154 def : InstRW<[A57Write_6cyc_1M], (instrs SMULHrr, UMULHrr)>;
157 // Miscellaneous Data-Processing Instructions
158 // -----------------------------------------------------------------------------
160 def : InstRW<[A57Write_1cyc_1I], (instrs EXTRWrri)>;
161 def : InstRW<[A57Write_3cyc_1I_1M], (instrs EXTRXrri)>;
162 def : InstRW<[A57Write_2cyc_1M], (instregex "BFM")>;
165 // Cryptography Extensions
166 // -----------------------------------------------------------------------------
168 def A57ReadAES : SchedReadAdvance<3, [A57Write_3cyc_1W]>;
169 def : InstRW<[A57Write_3cyc_1W], (instregex "^AES[DE]")>;
170 def : InstRW<[A57Write_3cyc_1W, A57ReadAES], (instregex "^AESI?MC")>;
171 def : InstRW<[A57Write_6cyc_2V], (instregex "^SHA1SU0")>;
172 def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA1(H|SU1)")>;
173 def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA1[CMP]")>;
174 def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA256SU0")>;
175 def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA256(H|H2|SU1)")>;
176 def : InstRW<[A57Write_3cyc_1W], (instregex "^CRC32")>;
180 // -----------------------------------------------------------------------------
182 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1i(8|16|32)$")>;
183 def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD1i(8|16|32)_POST$")>;
184 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1i(64)$")>;
185 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instregex "LD1i(64)_POST$")>;
187 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1Rv(8b|4h|2s)$")>;
188 def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD1Rv(8b|4h|2s)_POST$")>;
189 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Rv(1d)$")>;
190 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instregex "LD1Rv(1d)_POST$")>;
191 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1Rv(16b|8h|4s|2d)$")>;
192 def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD1Rv(16b|8h|4s|2d)_POST$")>;
194 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Onev(8b|4h|2s|1d)$")>;
195 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instregex "LD1Onev(8b|4h|2s|1d)_POST$")>;
196 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Onev(16b|8h|4s|2d)$")>;
197 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instregex "LD1Onev(16b|8h|4s|2d)_POST$")>;
198 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Twov(8b|4h|2s|1d)$")>;
199 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instregex "LD1Twov(8b|4h|2s|1d)_POST$")>;
200 def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Twov(16b|8h|4s|2d)$")>;
201 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD1Twov(16b|8h|4s|2d)_POST$")>;
202 def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Threev(8b|4h|2s|1d)$")>;
203 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD1Threev(8b|4h|2s|1d)_POST$")>;
204 def : InstRW<[A57Write_7cyc_3L], (instregex "LD1Threev(16b|8h|4s|2d)$")>;
205 def : InstRW<[A57Write_7cyc_3L, WriteAdr], (instregex "LD1Threev(16b|8h|4s|2d)_POST$")>;
206 def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Fourv(8b|4h|2s|1d)$")>;
207 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD1Fourv(8b|4h|2s|1d)_POST$")>;
208 def : InstRW<[A57Write_8cyc_4L], (instregex "LD1Fourv(16b|8h|4s|2d)$")>;
209 def : InstRW<[A57Write_8cyc_4L, WriteAdr], (instregex "LD1Fourv(16b|8h|4s|2d)_POST$")>;
211 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD2i(8|16)$")>;
212 def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD2i(8|16)_POST$")>;
213 def : InstRW<[A57Write_6cyc_2L], (instregex "LD2i(32)$")>;
214 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD2i(32)_POST$")>;
215 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2i(64)$")>;
216 def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD2i(64)_POST$")>;
218 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2Rv(8b|4h|2s)$")>;
219 def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD2Rv(8b|4h|2s)_POST$")>;
220 def : InstRW<[A57Write_5cyc_1L], (instregex "LD2Rv(1d)$")>;
221 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instregex "LD2Rv(1d)_POST$")>;
222 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD2Rv(16b|8h|4s|2d)$")>;
223 def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD2Rv(16b|8h|4s|2d)_POST$")>;
225 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2Twov(8b|4h|2s)$")>;
226 def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD2Twov(8b|4h|2s)_POST$")>;
227 def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD2Twov(16b|8h|4s)$")>;
228 def : InstRW<[A57Write_9cyc_2L_2V, WriteAdr], (instregex "LD2Twov(16b|8h|4s)_POST$")>;
229 def : InstRW<[A57Write_6cyc_2L], (instregex "LD2Twov(2d)$")>;
230 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD2Twov(2d)_POST$")>;
232 def : InstRW<[A57Write_9cyc_1L_3V], (instregex "LD3i(8|16)$")>;
233 def : InstRW<[A57Write_9cyc_1L_3V, WriteAdr], (instregex "LD3i(8|16)_POST$")>;
234 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD3i(32)$")>;
235 def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD3i(32)_POST$")>;
236 def : InstRW<[A57Write_6cyc_2L], (instregex "LD3i(64)$")>;
237 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD3i(64)_POST$")>;
239 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD3Rv(8b|4h|2s)$")>;
240 def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD3Rv(8b|4h|2s)_POST$")>;
241 def : InstRW<[A57Write_6cyc_2L], (instregex "LD3Rv(1d)$")>;
242 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD3Rv(1d)_POST$")>;
243 def : InstRW<[A57Write_9cyc_1L_3V], (instregex "LD3Rv(16b|8h|4s)$")>;
244 def : InstRW<[A57Write_9cyc_1L_3V, WriteAdr], (instregex "LD3Rv(16b|8h|4s)_POST$")>;
245 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD3Rv(2d)$")>;
246 def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD3Rv(2d)_POST$")>;
248 def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD3Threev(8b|4h|2s)$")>;
249 def : InstRW<[A57Write_9cyc_2L_2V, WriteAdr], (instregex "LD3Threev(8b|4h|2s)_POST$")>;
250 def : InstRW<[A57Write_10cyc_3L_4V], (instregex "LD3Threev(16b|8h|4s)$")>;
251 def : InstRW<[A57Write_10cyc_3L_4V, WriteAdr], (instregex "LD3Threev(16b|8h|4s)_POST$")>;
252 def : InstRW<[A57Write_8cyc_4L], (instregex "LD3Threev(2d)$")>;
253 def : InstRW<[A57Write_8cyc_4L, WriteAdr], (instregex "LD3Threev(2d)_POST$")>;
255 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4i(8|16)$")>;
256 def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD4i(8|16)_POST$")>;
257 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD4i(32)$")>;
258 def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD4i(32)_POST$")>;
259 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4i(64)$")>;
260 def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD4i(64)_POST$")>;
262 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD4Rv(8b|4h|2s)$")>;
263 def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD4Rv(8b|4h|2s)_POST$")>;
264 def : InstRW<[A57Write_6cyc_2L], (instregex "LD4Rv(1d)$")>;
265 def : InstRW<[A57Write_6cyc_2L, WriteAdr], (instregex "LD4Rv(1d)_POST$")>;
266 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4Rv(16b|8h|4s)$")>;
267 def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD4Rv(16b|8h|4s)_POST$")>;
268 def : InstRW<[A57Write_9cyc_2L_4V], (instregex "LD4Rv(2d)$")>;
269 def : InstRW<[A57Write_9cyc_2L_4V, WriteAdr], (instregex "LD4Rv(2d)_POST$")>;
271 def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD4Fourv(8b|4h|2s)$")>;
272 def : InstRW<[A57Write_9cyc_2L_2V, WriteAdr], (instregex "LD4Fourv(8b|4h|2s)_POST$")>;
273 def : InstRW<[A57Write_11cyc_4L_4V], (instregex "LD4Fourv(16b|8h|4s)$")>;
274 def : InstRW<[A57Write_11cyc_4L_4V, WriteAdr], (instregex "LD4Fourv(16b|8h|4s)_POST$")>;
275 def : InstRW<[A57Write_8cyc_4L], (instregex "LD4Fourv(2d)$")>;
276 def : InstRW<[A57Write_8cyc_4L, WriteAdr], (instregex "LD4Fourv(2d)_POST$")>;
279 // -----------------------------------------------------------------------------
281 def : InstRW<[A57Write_1cyc_1S], (instregex "ST1i(8|16|32)$")>;
282 def : InstRW<[A57Write_1cyc_1S, WriteAdr], (instregex "ST1i(8|16|32)_POST$")>;
283 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST1i(64)$")>;
284 def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr], (instregex "ST1i(64)_POST$")>;
286 def : InstRW<[A57Write_1cyc_1S], (instregex "ST1Onev(8b|4h|2s|1d)$")>;
287 def : InstRW<[A57Write_1cyc_1S, WriteAdr], (instregex "ST1Onev(8b|4h|2s|1d)_POST$")>;
288 def : InstRW<[A57Write_2cyc_2S], (instregex "ST1Onev(16b|8h|4s|2d)$")>;
289 def : InstRW<[A57Write_2cyc_2S, WriteAdr], (instregex "ST1Onev(16b|8h|4s|2d)_POST$")>;
290 def : InstRW<[A57Write_2cyc_2S], (instregex "ST1Twov(8b|4h|2s|1d)$")>;
291 def : InstRW<[A57Write_2cyc_2S, WriteAdr], (instregex "ST1Twov(8b|4h|2s|1d)_POST$")>;
292 def : InstRW<[A57Write_4cyc_4S], (instregex "ST1Twov(16b|8h|4s|2d)$")>;
293 def : InstRW<[A57Write_4cyc_4S, WriteAdr], (instregex "ST1Twov(16b|8h|4s|2d)_POST$")>;
294 def : InstRW<[A57Write_3cyc_3S], (instregex "ST1Threev(8b|4h|2s|1d)$")>;
295 def : InstRW<[A57Write_3cyc_3S, WriteAdr], (instregex "ST1Threev(8b|4h|2s|1d)_POST$")>;
296 def : InstRW<[A57Write_6cyc_6S], (instregex "ST1Threev(16b|8h|4s|2d)$")>;
297 def : InstRW<[A57Write_6cyc_6S, WriteAdr], (instregex "ST1Threev(16b|8h|4s|2d)_POST$")>;
298 def : InstRW<[A57Write_4cyc_4S], (instregex "ST1Fourv(8b|4h|2s|1d)$")>;
299 def : InstRW<[A57Write_4cyc_4S, WriteAdr], (instregex "ST1Fourv(8b|4h|2s|1d)_POST$")>;
300 def : InstRW<[A57Write_8cyc_8S], (instregex "ST1Fourv(16b|8h|4s|2d)$")>;
301 def : InstRW<[A57Write_8cyc_8S, WriteAdr], (instregex "ST1Fourv(16b|8h|4s|2d)_POST$")>;
303 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST2i(8|16|32)$")>;
304 def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr], (instregex "ST2i(8|16|32)_POST$")>;
305 def : InstRW<[A57Write_2cyc_2S], (instregex "ST2i(64)$")>;
306 def : InstRW<[A57Write_2cyc_2S, WriteAdr], (instregex "ST2i(64)_POST$")>;
308 def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST2Twov(8b|4h|2s)$")>;
309 def : InstRW<[A57Write_3cyc_2S_1V, WriteAdr], (instregex "ST2Twov(8b|4h|2s)_POST$")>;
310 def : InstRW<[A57Write_4cyc_4S_2V], (instregex "ST2Twov(16b|8h|4s)$")>;
311 def : InstRW<[A57Write_4cyc_4S_2V, WriteAdr], (instregex "ST2Twov(16b|8h|4s)_POST$")>;
312 def : InstRW<[A57Write_4cyc_4S], (instregex "ST2Twov(2d)$")>;
313 def : InstRW<[A57Write_4cyc_4S, WriteAdr], (instregex "ST2Twov(2d)_POST$")>;
315 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST3i(8|16)$")>;
316 def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr], (instregex "ST3i(8|16)_POST$")>;
317 def : InstRW<[A57Write_3cyc_3S], (instregex "ST3i(32)$")>;
318 def : InstRW<[A57Write_3cyc_3S, WriteAdr], (instregex "ST3i(32)_POST$")>;
319 def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST3i(64)$")>;
320 def : InstRW<[A57Write_3cyc_2S_1V, WriteAdr], (instregex "ST3i(64)_POST$")>;
322 def : InstRW<[A57Write_3cyc_3S_2V], (instregex "ST3Threev(8b|4h|2s)$")>;
323 def : InstRW<[A57Write_3cyc_3S_2V, WriteAdr], (instregex "ST3Threev(8b|4h|2s)_POST$")>;
324 def : InstRW<[A57Write_6cyc_6S_4V], (instregex "ST3Threev(16b|8h|4s)$")>;
325 def : InstRW<[A57Write_6cyc_6S_4V, WriteAdr], (instregex "ST3Threev(16b|8h|4s)_POST$")>;
326 def : InstRW<[A57Write_6cyc_6S], (instregex "ST3Threev(2d)$")>;
327 def : InstRW<[A57Write_6cyc_6S, WriteAdr], (instregex "ST3Threev(2d)_POST$")>;
329 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST4i(8|16)$")>;
330 def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr], (instregex "ST4i(8|16)_POST$")>;
331 def : InstRW<[A57Write_4cyc_4S], (instregex "ST4i(32)$")>;
332 def : InstRW<[A57Write_4cyc_4S, WriteAdr], (instregex "ST4i(32)_POST$")>;
333 def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST4i(64)$")>;
334 def : InstRW<[A57Write_3cyc_2S_1V, WriteAdr], (instregex "ST4i(64)_POST$")>;
336 def : InstRW<[A57Write_4cyc_4S_2V], (instregex "ST4Fourv(8b|4h|2s)$")>;
337 def : InstRW<[A57Write_4cyc_4S_2V, WriteAdr], (instregex "ST4Fourv(8b|4h|2s)_POST$")>;
338 def : InstRW<[A57Write_8cyc_8S_4V], (instregex "ST4Fourv(16b|8h|4s)$")>;
339 def : InstRW<[A57Write_8cyc_8S_4V, WriteAdr], (instregex "ST4Fourv(16b|8h|4s)_POST$")>;
340 def : InstRW<[A57Write_8cyc_8S], (instregex "ST4Fourv(2d)$")>;
341 def : InstRW<[A57Write_8cyc_8S, WriteAdr], (instregex "ST4Fourv(2d)_POST$")>;
344 // -----------------------------------------------------------------------------
346 // Reference for forms in this group
347 // D form - v8i8, v4i16, v2i32
348 // Q form - v16i8, v8i16, v4i32
349 // D form - v1i8, v1i16, v1i32, v1i64
350 // Q form - v16i8, v8i16, v4i32, v2i64
351 // D form - v8i8_v8i16, v4i16_v4i32, v2i32_v2i64
352 // Q form - v16i8_v8i16, v8i16_v4i32, v4i32_v2i64
354 // Cortex A57 Software Optimization Guide Sec 3.14
355 // Advance for absolute diff accum, pairwise add and accumulate, shift accumulate
356 def A57ReadIVA3 : SchedReadAdvance<3, [A57Write_4cyc_1X_NonMul_Forward, A57Write_5cyc_2X_NonMul_Forward]>;
358 // ASIMD absolute diff accum, D-form
359 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v8i8|v4i16|v2i32)$")>;
360 // ASIMD absolute diff accum, Q-form
361 def : InstRW<[A57Write_5cyc_2X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v16i8|v8i16|v4i32)$")>;
362 // ASIMD absolute diff accum long
363 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABAL")>;
365 // ASIMD arith, reduce, 4H/4S
366 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?ADDL?V(v8i8|v4i16|v2i32)v$")>;
367 // ASIMD arith, reduce, 8B/8H
368 def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU]?ADDL?V(v8i16|v4i32)v$")>;
369 // ASIMD arith, reduce, 16B
370 def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU]?ADDL?Vv16i8v$")>;
372 // ASIMD max/min, reduce, 4H/4S
373 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU](MIN|MAX)V(v4i16|v4i32)v$")>;
374 // ASIMD max/min, reduce, 8B/8H
375 def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU](MIN|MAX)V(v8i8|v8i16)v$")>;
376 // ASIMD max/min, reduce, 16B
377 def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU](MIN|MAX)Vv16i8v$")>;
379 // ASIMD multiply, D-form
381 def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^MUL(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>;
382 // PMUL, SQDMULH, SQRDMULH
383 def : InstRW<[A57Write_5cyc_1W], (instregex "^(PMUL|SQR?DMULH)(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>;
385 // ASIMD multiply, Q-form
387 def : InstRW<[A57Write_6cyc_2W_Mul_Forward], (instregex "^MUL(v16i8|v8i16|v4i32)(_indexed)?$")>;
388 // PMUL, SQDMULH, SQRDMULH
389 def : InstRW<[A57Write_6cyc_2W], (instregex "^(PMUL|SQR?DMULH)(v16i8|v8i16|v4i32)(_indexed)?$")>;
391 // Cortex A57 Software Optimization Guide Sec 3.14
392 def A57ReadIVMA4 : SchedReadAdvance<4 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>;
393 def A57ReadIVMA3 : SchedReadAdvance<3 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>;
395 // ASIMD multiply accumulate, D-form
396 def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v8i8|v4i16|v2i32)(_indexed)?$")>;
397 // ASIMD multiply accumulate, Q-form
398 def : InstRW<[A57Write_6cyc_2W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v16i8|v8i16|v4i32)(_indexed)?$")>;
400 // ASIMD multiply accumulate long
401 // ASIMD multiply accumulate saturating long
402 def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^(S|U)ML[AS]L")>;
403 def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA3], (instregex "^SQDML[AS]L")>;
405 // ASIMD multiply long
406 def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^(S|U)MULL")>;
407 def : InstRW<[A57Write_5cyc_1W], (instregex "^SQDMULL")>;
408 def : InstRW<[A57Write_5cyc_1W], (instregex "^PMULL(v8i8|v16i8)")>;
409 def : InstRW<[A57Write_3cyc_1W], (instregex "^PMULL(v1i64|v2i64)")>;
411 // ASIMD pairwise add and accumulate
412 // ASIMD shift accumulate
413 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ADALP")>;
414 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^(S|SR|U|UR)SRA")>;
416 // ASIMD shift by immed, complex
417 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?(Q|R){1,2}SHR")>;
418 def : InstRW<[A57Write_4cyc_1X], (instregex "^SQSHLU")>;
421 // ASIMD shift by register, basic, Q-form
422 def : InstRW<[A57Write_4cyc_2X], (instregex "^[SU]SHL(v16i8|v8i16|v4i32|v2i64)")>;
424 // ASIMD shift by register, complex, D-form
425 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU][QR]{1,2}SHL(v1i8|v1i16|v1i32|v1i64|v8i8|v4i16|v2i32|b|d|h|s)")>;
427 // ASIMD shift by register, complex, Q-form
428 def : InstRW<[A57Write_5cyc_2X], (instregex "^[SU][QR]{1,2}SHL(v16i8|v8i16|v4i32|v2i64)")>;
431 // Vector - Floating Point
432 // -----------------------------------------------------------------------------
434 // Reference for forms in this group
436 // Q form - v4f32, v2f64
438 // D form - v1i32, v1i64
440 // Q form - v4i32, v2i64
442 // ASIMD FP arith, normal, D-form
443 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FABD|FADD|FSUB)(v2f32|32|64|v2i32p)")>;
444 // ASIMD FP arith, normal, Q-form
445 def : InstRW<[A57Write_5cyc_2V], (instregex "^(FABD|FADD|FSUB)(v4f32|v2f64|v2i64p)")>;
447 // ASIMD FP arith, pairwise, D-form
448 def : InstRW<[A57Write_5cyc_1V], (instregex "^FADDP(v2f32|32|64|v2i32)")>;
449 // ASIMD FP arith, pairwise, Q-form
450 def : InstRW<[A57Write_9cyc_3V], (instregex "^FADDP(v4f32|v2f64|v2i64)")>;
452 // ASIMD FP compare, D-form
453 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v2f32|32|64|v1i32|v2i32|v1i64)")>;
454 // ASIMD FP compare, Q-form
455 def : InstRW<[A57Write_5cyc_2V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v4f32|v2f64|v4i32|v2i64)")>;
457 // ASIMD FP convert, long and narrow
458 def : InstRW<[A57Write_8cyc_3V], (instregex "^FCVT(L|N|XN)v")>;
459 // ASIMD FP convert, other, D-form
460 def : InstRW<[A57Write_5cyc_1V], (instregex "^[FVSU]CVT([AMNPZ][SU])?(_Int)?(v2f32|v1i32|v2i32|v1i64)")>;
461 // ASIMD FP convert, other, Q-form
462 def : InstRW<[A57Write_5cyc_2V], (instregex "^[FVSU]CVT([AMNPZ][SU])?(_Int)?(v4f32|v2f64|v4i32|v2i64)")>;
464 // ASIMD FP divide, D-form, F32
465 def : InstRW<[A57Write_17cyc_1W], (instregex "FDIVv2f32")>;
466 // ASIMD FP divide, Q-form, F32
467 def : InstRW<[A57Write_34cyc_2W], (instregex "FDIVv4f32")>;
468 // ASIMD FP divide, Q-form, F64
469 def : InstRW<[A57Write_64cyc_2W], (instregex "FDIVv2f64")>;
471 // Note: These were simply duplicated from ASIMD FDIV because of missing documentation
472 // ASIMD FP square root, D-form, F32
473 def : InstRW<[A57Write_17cyc_1W], (instregex "FSQRTv2f32")>;
474 // ASIMD FP square root, Q-form, F32
475 def : InstRW<[A57Write_34cyc_2W], (instregex "FSQRTv4f32")>;
476 // ASIMD FP square root, Q-form, F64
477 def : InstRW<[A57Write_64cyc_2W], (instregex "FSQRTv2f64")>;
479 // ASIMD FP max/min, normal, D-form
480 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?(v2f32)")>;
481 // ASIMD FP max/min, normal, Q-form
482 def : InstRW<[A57Write_5cyc_2V], (instregex "^(FMAX|FMIN)(NM)?(v4f32|v2f64)")>;
483 // ASIMD FP max/min, pairwise, D-form
484 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?P(v2f32|v2i32)")>;
485 // ASIMD FP max/min, pairwise, Q-form
486 def : InstRW<[A57Write_9cyc_3V], (instregex "^(FMAX|FMIN)(NM)?P(v4f32|v2f64|v2i64)")>;
487 // ASIMD FP max/min, reduce
488 def : InstRW<[A57Write_10cyc_3V], (instregex "^(FMAX|FMIN)(NM)?Vv")>;
490 // ASIMD FP multiply, D-form, FZ
491 def : InstRW<[A57Write_5cyc_1V_FP_Forward], (instregex "^FMULX?(v2f32|v1i32|v2i32|v1i64|32|64)")>;
492 // ASIMD FP multiply, Q-form, FZ
493 def : InstRW<[A57Write_5cyc_2V_FP_Forward], (instregex "^FMULX?(v4f32|v2f64|v4i32|v2i64)")>;
495 // ASIMD FP multiply accumulate, D-form, FZ
496 // ASIMD FP multiply accumulate, Q-form, FZ
497 def A57WriteFPVMAD : SchedWriteRes<[A57UnitV]> { let Latency = 9; }
498 def A57WriteFPVMAQ : SchedWriteRes<[A57UnitV, A57UnitV]> { let Latency = 10; }
500 // Cortex A57 Software Optimization Guide Sec 3.15
501 // Advances from FP mul and mul-accum to mul-accum
502 def A57ReadFPVMA5 : SchedReadAdvance<5, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>;
503 def A57ReadFPVMA6 : SchedReadAdvance<6, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>;
505 def : InstRW<[A57WriteFPVMAD, A57ReadFPVMA5], (instregex "^FML[AS](v2f32|v1i32|v2i32|v1i64)")>;
506 def : InstRW<[A57WriteFPVMAQ, A57ReadFPVMA6], (instregex "^FML[AS](v4f32|v2f64|v4i32|v2i64)")>;
508 // ASIMD FP round, D-form
509 def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT[AIMNPXZ](v2f32)")>;
510 // ASIMD FP round, Q-form
511 def : InstRW<[A57Write_5cyc_2V], (instregex "^FRINT[AIMNPXZ](v4f32|v2f64)")>;
514 // Vector - Miscellaneous
515 // -----------------------------------------------------------------------------
517 // Reference for forms in this group
518 // D form - v8i8, v4i16, v2i32
519 // Q form - v16i8, v8i16, v4i32
520 // D form - v1i8, v1i16, v1i32, v1i64
521 // Q form - v16i8, v8i16, v4i32, v2i64
523 // ASIMD bitwise insert, Q-form
524 def : InstRW<[A57Write_3cyc_2V], (instregex "^(BIF|BIT|BSL|BSP)v16i8")>;
526 // ASIMD duplicate, gen reg, D-form and Q-form
527 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^CPY")>;
528 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUPv.+gpr")>;
530 // ASIMD move, saturating
531 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]QXTU?N")>;
533 // ASIMD reciprocal estimate, D-form
534 def : InstRW<[A57Write_5cyc_1V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f32|v1i32|v2i32|v1i64)")>;
535 // ASIMD reciprocal estimate, Q-form
536 def : InstRW<[A57Write_5cyc_2V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f64|v4f32|v4i32)")>;
538 // ASIMD reciprocal step, D-form, FZ
539 def : InstRW<[A57Write_9cyc_1V], (instregex "^F(RECP|RSQRT)S(v2f32|v1i32|v2i32|v1i64|32|64)")>;
540 // ASIMD reciprocal step, Q-form, FZ
541 def : InstRW<[A57Write_9cyc_2V], (instregex "^F(RECP|RSQRT)S(v2f64|v4f32|v4i32)")>;
543 // ASIMD table lookup, D-form
544 def : InstRW<[A57Write_3cyc_1V], (instregex "^TB[LX]v8i8One")>;
545 def : InstRW<[A57Write_6cyc_2V], (instregex "^TB[LX]v8i8Two")>;
546 def : InstRW<[A57Write_9cyc_3V], (instregex "^TB[LX]v8i8Three")>;
547 def : InstRW<[A57Write_12cyc_4V], (instregex "^TB[LX]v8i8Four")>;
548 // ASIMD table lookup, Q-form
549 def : InstRW<[A57Write_6cyc_3V], (instregex "^TB[LX]v16i8One")>;
550 def : InstRW<[A57Write_9cyc_5V], (instregex "^TB[LX]v16i8Two")>;
551 def : InstRW<[A57Write_12cyc_7V], (instregex "^TB[LX]v16i8Three")>;
552 def : InstRW<[A57Write_15cyc_9V], (instregex "^TB[LX]v16i8Four")>;
554 // ASIMD transfer, element to gen reg
555 def : InstRW<[A57Write_6cyc_1I_1L], (instregex "^[SU]MOVv")>;
557 // ASIMD transfer, gen reg to element
558 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^INSv")>;
560 // ASIMD unzip/zip, Q-form
561 def : InstRW<[A57Write_6cyc_3V], (instregex "^(UZP|ZIP)(1|2)(v16i8|v8i16|v4i32|v2i64)")>;
565 // -----------------------------------------------------------------------------
567 def : InstRW<[A57Write_5cyc_1V], (instregex "^F(ADD|SUB)[DS]rr")>;
569 // Cortex A57 Software Optimization Guide Sec 3.10
570 def A57WriteFPMA : SchedWriteRes<[A57UnitV]> { let Latency = 9; }
571 def A57ReadFPMA5 : SchedReadAdvance<5, [A57WriteFPMA, WriteFMul]>;
572 def A57ReadFPM : SchedReadAdvance<0>;
573 def : InstRW<[A57WriteFPMA, A57ReadFPM, A57ReadFPM, A57ReadFPMA5], (instregex "^FN?M(ADD|SUB)[DS]rrr")>;
575 def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[FSU]CVT[AMNPZ][SU](_Int)?[SU]?[XW]?[DS]?[rds]i?")>;
576 def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[SU]CVTF")>;
578 def : InstRW<[A57Write_32cyc_1W], (instrs FDIVDrr)>;
579 def : InstRW<[A57Write_17cyc_1W], (instrs FDIVSrr)>;
581 def : InstRW<[A57Write_5cyc_1V], (instregex "^F(MAX|MIN).+rr")>;
583 def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT.+r")>;
585 def : InstRW<[A57Write_32cyc_1W], (instrs FSQRTDr)>;
586 def : InstRW<[A57Write_17cyc_1W], (instrs FSQRTSr)>;
588 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPDi)>;
589 def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDNPQi)>;
590 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPSi)>;
591 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPDi)>;
592 def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPDpost)>;
593 def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPDpre)>;
594 def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDPQi)>;
595 def : InstRW<[A57Write_6cyc_2L, WriteLDHi, WriteAdr], (instrs LDPQpost)>;
596 def : InstRW<[A57Write_6cyc_2L, WriteLDHi, WriteAdr], (instrs LDPQpre)>;
597 def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWi)>;
598 def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi, WriteAdr], (instrs LDPSWpost)>;
599 def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi, WriteAdr], (instrs LDPSWpre)>;
600 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPSi)>;
601 def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPSpost)>;
602 def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPSpre)>;
603 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRBpost)>;
604 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRBpre)>;
605 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroW)>;
606 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroX)>;
607 def : InstRW<[A57Write_5cyc_1L], (instrs LDRBui)>;
608 def : InstRW<[A57Write_5cyc_1L], (instrs LDRDl)>;
609 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRDpost)>;
610 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRDpre)>;
611 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroW)>;
612 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroX)>;
613 def : InstRW<[A57Write_5cyc_1L], (instrs LDRDui)>;
614 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroW)>;
615 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroX)>;
616 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRHpost)>;
617 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRHpre)>;
618 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroW)>;
619 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroX)>;
620 def : InstRW<[A57Write_5cyc_1L], (instrs LDRHui)>;
621 def : InstRW<[A57Write_5cyc_1L], (instrs LDRQl)>;
622 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRQpost)>;
623 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRQpre)>;
624 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroW)>;
625 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroX)>;
626 def : InstRW<[A57Write_5cyc_1L], (instrs LDRQui)>;
627 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroW)>;
628 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroX)>;
629 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroW)>;
630 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroX)>;
631 def : InstRW<[A57Write_5cyc_1L], (instrs LDRSl)>;
632 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRSpost)>;
633 def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRSpre)>;
634 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroW)>;
635 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroX)>;
636 def : InstRW<[A57Write_5cyc_1L], (instrs LDRSui)>;
637 def : InstRW<[A57Write_5cyc_1L], (instrs LDURBi)>;
638 def : InstRW<[A57Write_5cyc_1L], (instrs LDURDi)>;
639 def : InstRW<[A57Write_5cyc_1L], (instrs LDURHi)>;
640 def : InstRW<[A57Write_5cyc_1L], (instrs LDURQi)>;
641 def : InstRW<[A57Write_5cyc_1L], (instrs LDURSi)>;
643 def : InstRW<[A57Write_2cyc_2S], (instrs STNPDi)>;
644 def : InstRW<[A57Write_4cyc_1I_4S], (instrs STNPQi)>;
645 def : InstRW<[A57Write_2cyc_2S], (instrs STNPXi)>;
646 def : InstRW<[A57Write_2cyc_2S], (instrs STPDi)>;
647 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpost)>;
648 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpre)>;
649 def : InstRW<[A57Write_4cyc_1I_4S], (instrs STPQi)>;
650 def : InstRW<[WriteAdr, A57Write_4cyc_1I_4S], (instrs STPQpost)>;
651 def : InstRW<[WriteAdr, A57Write_4cyc_2I_4S], (instrs STPQpre)>;
652 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpost)>;
653 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpre)>;
654 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpost)>;
655 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpre)>;
656 def : InstRW<[A57Write_2cyc_2S], (instrs STPXi)>;
657 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpost)>;
658 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpre)>;
659 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpost)>;
660 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpre)>;
661 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBpost)>;
662 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRBpre)>;
663 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroW)>;
664 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroX)>;
665 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRDpost)>;
666 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRDpre)>;
667 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpost)>;
668 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpre)>;
669 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroW)>;
670 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroX)>;
671 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHpost)>;
672 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRHpre)>;
673 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroW)>;
674 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroX)>;
675 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQpost)>;
676 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STRQpre)>;
677 def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroW)>;
678 def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroX)>;
679 def : InstRW<[A57Write_2cyc_1I_2S], (instrs STRQui)>;
680 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRSpost)>;
681 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRSpre)>;
682 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpost)>;
683 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpre)>;
684 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpost)>;
685 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpre)>;
686 def : InstRW<[A57Write_2cyc_2S], (instrs STURQi)>;
688 } // SchedModel = CortexA57Model