Add gfx950 mfma instructions to ROCDL dialect (#123361)
[llvm-project.git] / llvm / lib / Target / ARM / ARMScheduleA57WriteRes.td
blob025023c5f41a9e855282e06e72350cf77cd8d368
1 //=- ARMScheduleA57WriteRes.td - ARM Cortex-A57 Write Res ---*- tablegen -*-=//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Contains all of the Cortex-A57 specific SchedWriteRes types. The approach
10 // below is to define a generic SchedWriteRes for every combination of
11 // latency and microOps. The naming convention is to use a prefix, one field
12 // for latency, and one or more microOp count/type designators.
13 //   Prefix: A57Write
14 //   Latency: #cyc
15 //   MicroOp Count/Types: #(B|I|M|L|S|X|W|V)
17 // e.g. A57Write_6cyc_1I_6S_4V means the total latency is 6 and there are
18 //      11 micro-ops to be issued as follows: one to I pipe, six to S pipes and
19 //      four to V pipes.
21 //===----------------------------------------------------------------------===//
23 //===----------------------------------------------------------------------===//
24 // Define Generic 1 micro-op types
// Single-resource write types: every record lists exactly one A57 unit and
// carries the latency spelled out in its name. Some records additionally set
// ReleaseAtCycles for that unit.
let Latency = 5 in def A57Write_5cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 5 in def A57Write_5cyc_1V : SchedWriteRes<[A57UnitV]>;
let Latency = 5 in def A57Write_5cyc_1W : SchedWriteRes<[A57UnitW]>;
let Latency = 10 in def A57Write_10cyc_1V : SchedWriteRes<[A57UnitV]>;
let Latency = 17, ReleaseAtCycles = [17] in
def A57Write_17cyc_1W : SchedWriteRes<[A57UnitW]>;
let Latency = 18, ReleaseAtCycles = [18] in
def A57Write_18cyc_1X : SchedWriteRes<[A57UnitX]>;
let Latency = 19, ReleaseAtCycles = [19] in
def A57Write_19cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 20, ReleaseAtCycles = [20] in
def A57Write_20cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 1 in def A57Write_1cyc_1B : SchedWriteRes<[A57UnitB]>;
let Latency = 1, ReleaseAtCycles = [1] in
def A57Write_1cyc_1I : SchedWriteRes<[A57UnitI]>;
let Latency = 2, ReleaseAtCycles = [1] in
def A57Write_2cyc_1I : SchedWriteRes<[A57UnitI]>;
let Latency = 3 in def A57Write_3cyc_1I : SchedWriteRes<[A57UnitI]>;
let Latency = 1 in def A57Write_1cyc_1S : SchedWriteRes<[A57UnitS]>;
let Latency = 2 in def A57Write_2cyc_1S : SchedWriteRes<[A57UnitS]>;
let Latency = 3 in def A57Write_3cyc_1S : SchedWriteRes<[A57UnitS]>;
let Latency = 2, ReleaseAtCycles = [1] in
def A57Write_2cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 32, ReleaseAtCycles = [32] in
def A57Write_32cyc_1W : SchedWriteRes<[A57UnitW]>;
let Latency = 32, ReleaseAtCycles = [32] in
def A57Write_32cyc_1X : SchedWriteRes<[A57UnitX]>;
let Latency = 35, ReleaseAtCycles = [35] in
def A57Write_35cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 3 in def A57Write_3cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 3 in def A57Write_3cyc_1V : SchedWriteRes<[A57UnitV]>;
let Latency = 3 in def A57Write_3cyc_1W : SchedWriteRes<[A57UnitW]>;
let Latency = 3 in def A57Write_3cyc_1X : SchedWriteRes<[A57UnitX]>;
// Generates A57Write_3cyc_1L through A57Write_20cyc_1L: one record per
// latency value, each on the A57UnitL resource.
foreach Lat = 3-20 in
  def A57Write_#Lat#cyc_1L : SchedWriteRes<[A57UnitL]> {
    let Latency = Lat;
  }
// Generates A57Write_4cyc_1S through A57Write_16cyc_1S: one record per
// latency value, each on the A57UnitS resource.
foreach Lat = 4-16 in
  def A57Write_#Lat#cyc_1S : SchedWriteRes<[A57UnitS]> {
    let Latency = Lat;
  }
// Remaining single-resource write types; the latency matches the number in
// each record's name.
let Latency = 4 in def A57Write_4cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 4 in def A57Write_4cyc_1X : SchedWriteRes<[A57UnitX]>;
let Latency = 4 in def A57Write_4cyc_1W : SchedWriteRes<[A57UnitW]>;
let Latency = 5 in def A57Write_5cyc_1X : SchedWriteRes<[A57UnitX]>;
let Latency = 6 in def A57Write_6cyc_1X : SchedWriteRes<[A57UnitX]>;
let Latency = 6 in def A57Write_6cyc_1W : SchedWriteRes<[A57UnitW]>;
let Latency = 8 in def A57Write_8cyc_1V : SchedWriteRes<[A57UnitV]>;
let Latency = 9 in def A57Write_9cyc_1V : SchedWriteRes<[A57UnitV]>;
let Latency = 6 in def A57Write_6cyc_1M : SchedWriteRes<[A57UnitM]>;
let Latency = 6 in def A57Write_6cyc_1V : SchedWriteRes<[A57UnitV]>;
86 //===----------------------------------------------------------------------===//
87 // Define Generic 2 micro-op types
// Two-micro-op write types. Each record lists two A57 units (in the order
// given by its name suffix), sets NumMicroOps to 2 and uses the latency from
// its name.
let Latency = 64, NumMicroOps = 2, ReleaseAtCycles = [32, 32] in
def A57Write_64cyc_2X : SchedWriteRes<[A57UnitX, A57UnitX]>;
let Latency = 6, NumMicroOps = 2 in
def A57Write_6cyc_1I_1L : SchedWriteRes<[A57UnitI, A57UnitL]>;
let Latency = 6, NumMicroOps = 2 in
def A57Write_6cyc_1V_1X : SchedWriteRes<[A57UnitV, A57UnitX]>;
let Latency = 7, NumMicroOps = 2 in
def A57Write_7cyc_1V_1X : SchedWriteRes<[A57UnitV, A57UnitX]>;
let Latency = 8, NumMicroOps = 2 in
def A57Write_8cyc_1L_1V : SchedWriteRes<[A57UnitL, A57UnitV]>;
let Latency = 9, NumMicroOps = 2 in
def A57Write_9cyc_1L_1V : SchedWriteRes<[A57UnitL, A57UnitV]>;
let Latency = 9, NumMicroOps = 2 in
def A57Write_9cyc_2V : SchedWriteRes<[A57UnitV, A57UnitV]>;
let Latency = 8, NumMicroOps = 2 in
def A57Write_8cyc_2X : SchedWriteRes<[A57UnitX, A57UnitX]>;
let Latency = 6, NumMicroOps = 2 in
def A57Write_6cyc_2L : SchedWriteRes<[A57UnitL, A57UnitL]>;
let Latency = 6, NumMicroOps = 2 in
def A57Write_6cyc_2V : SchedWriteRes<[A57UnitV, A57UnitV]>;
let Latency = 6, NumMicroOps = 2 in
def A57Write_6cyc_2W : SchedWriteRes<[A57UnitW, A57UnitW]>;
let Latency = 5, NumMicroOps = 2 in
def A57Write_5cyc_1I_1L : SchedWriteRes<[A57UnitI, A57UnitL]>;
let Latency = 5, NumMicroOps = 2 in
def A57Write_5cyc_1I_1M : SchedWriteRes<[A57UnitI, A57UnitM]>;
let Latency = 5, NumMicroOps = 2 in
def A57Write_5cyc_2V : SchedWriteRes<[A57UnitV, A57UnitV]>;
let Latency = 5, NumMicroOps = 2 in
def A57Write_5cyc_2X : SchedWriteRes<[A57UnitX, A57UnitX]>;
let Latency = 10, NumMicroOps = 2 in
def A57Write_10cyc_1L_1V : SchedWriteRes<[A57UnitL, A57UnitV]>;
let Latency = 10, NumMicroOps = 2 in
def A57Write_10cyc_2V : SchedWriteRes<[A57UnitV, A57UnitV]>;
let Latency = 1, NumMicroOps = 2 in
def A57Write_1cyc_1B_1I : SchedWriteRes<[A57UnitB, A57UnitI]>;
let Latency = 1, NumMicroOps = 2 in
def A57Write_1cyc_1I_1S : SchedWriteRes<[A57UnitI, A57UnitS]>;
let Latency = 1, NumMicroOps = 2 in
def A57Write_1cyc_1S_1I : SchedWriteRes<[A57UnitS, A57UnitI]>;
let Latency = 2, NumMicroOps = 2 in
def A57Write_2cyc_1S_1I : SchedWriteRes<[A57UnitS, A57UnitI]>;
let Latency = 3, NumMicroOps = 2 in
def A57Write_3cyc_1S_1I : SchedWriteRes<[A57UnitS, A57UnitI]>;
let Latency = 1, NumMicroOps = 2 in
def A57Write_1cyc_1S_1M : SchedWriteRes<[A57UnitS, A57UnitM]>;
let Latency = 2, NumMicroOps = 2 in
def A57Write_2cyc_1B_1I : SchedWriteRes<[A57UnitB, A57UnitI]>;
let Latency = 3, NumMicroOps = 2 in
def A57Write_3cyc_1B_1I : SchedWriteRes<[A57UnitB, A57UnitI]>;
// Two micro-ops with a 6-cycle latency: one on the B unit and one on the L
// unit, as the "_1B_1L" suffix states under this file's naming convention.
// The second resource used to be A57UnitI, which contradicted the record name
// (it matched the neighbouring *_1B_1I records instead).
// NOTE(review): confirm against the Cortex-A57 optimization guide that the
// instructions mapped to this write type really use the load pipe.
def A57Write_6cyc_1B_1L  : SchedWriteRes<[A57UnitB,
                                          A57UnitL]> {
  let Latency     = 6;
  let NumMicroOps = 2;
}
// More two-micro-op write types: two listed A57 units, NumMicroOps of 2 and
// the latency given in the record name.
let Latency = 2, NumMicroOps = 2 in
def A57Write_2cyc_1I_1M : SchedWriteRes<[A57UnitI, A57UnitM]>;
let Latency = 2, NumMicroOps = 2 in
def A57Write_2cyc_2S : SchedWriteRes<[A57UnitS, A57UnitS]>;
let Latency = 2, NumMicroOps = 2 in
def A57Write_2cyc_2V : SchedWriteRes<[A57UnitV, A57UnitV]>;
let Latency = 36, NumMicroOps = 2, ReleaseAtCycles = [18, 18] in
def A57Write_36cyc_2X : SchedWriteRes<[A57UnitX, A57UnitX]>;
let Latency = 3, NumMicroOps = 2 in
def A57Write_3cyc_1I_1M : SchedWriteRes<[A57UnitI, A57UnitM]>;
let Latency = 4, NumMicroOps = 2 in
def A57Write_4cyc_1I_1M : SchedWriteRes<[A57UnitI, A57UnitM]>;
// Generates A57Write_3cyc_1L_1I through A57Write_20cyc_1L_1I: two micro-ops
// (A57UnitL then A57UnitI) for every latency value in the range.
foreach Lat = 3-20 in
  def A57Write_#Lat#cyc_1L_1I : SchedWriteRes<[A57UnitL, A57UnitI]> {
    let Latency     = Lat;
    let NumMicroOps = 2;
  }
// Two-micro-op write types pairing the S/I/V units; latency comes from the
// record name.
let Latency = 3, NumMicroOps = 2 in
def A57Write_3cyc_1I_1S : SchedWriteRes<[A57UnitI, A57UnitS]>;
let Latency = 3, NumMicroOps = 2 in
def A57Write_3cyc_1S_1V : SchedWriteRes<[A57UnitS, A57UnitV]>;
let Latency = 4, NumMicroOps = 2 in
def A57Write_4cyc_1S_1V : SchedWriteRes<[A57UnitS, A57UnitV]>;
let Latency = 3, NumMicroOps = 2 in
def A57Write_3cyc_2V : SchedWriteRes<[A57UnitV, A57UnitV]>;
// Generates A57Write_4cyc_1S_1I through A57Write_16cyc_1S_1I: two micro-ops
// (A57UnitS then A57UnitI) for every latency value in the range.
foreach Lat = 4-16 in
  def A57Write_#Lat#cyc_1S_1I : SchedWriteRes<[A57UnitS, A57UnitI]> {
    let Latency     = Lat;
    let NumMicroOps = 2;
  }
// Two micro-ops, both on A57UnitX, with a latency of 4.
let Latency = 4, NumMicroOps = 2 in
def A57Write_4cyc_2X : SchedWriteRes<[A57UnitX, A57UnitX]>;
280 //===----------------------------------------------------------------------===//
281 // Define Generic 3 micro-op types
// Three-micro-op write types. Each record lists three A57 units in the order
// of its name suffix, sets NumMicroOps to 3 and uses the latency from its
// name.
let Latency = 10, NumMicroOps = 3 in
def A57Write_10cyc_3V : SchedWriteRes<[A57UnitV, A57UnitV, A57UnitV]>;
let Latency = 2, NumMicroOps = 3 in
def A57Write_2cyc_1I_2S : SchedWriteRes<[A57UnitI, A57UnitS, A57UnitS]>;
let Latency = 3, NumMicroOps = 3 in
def A57Write_3cyc_1I_1S_1V : SchedWriteRes<[A57UnitI, A57UnitS, A57UnitV]>;
let Latency = 3, NumMicroOps = 3 in
def A57Write_3cyc_1S_1V_1I : SchedWriteRes<[A57UnitS, A57UnitV, A57UnitI]>;
let Latency = 4, NumMicroOps = 3 in
def A57Write_4cyc_1S_1V_1I : SchedWriteRes<[A57UnitS, A57UnitV, A57UnitI]>;
let Latency = 4, NumMicroOps = 3 in
def A57Write_4cyc_1I_1L_1M : SchedWriteRes<[A57UnitI, A57UnitL, A57UnitM]>;
let Latency = 8, NumMicroOps = 3 in
def A57Write_8cyc_1L_1V_1I : SchedWriteRes<[A57UnitL, A57UnitV, A57UnitI]>;
let Latency = 9, NumMicroOps = 3 in
def A57Write_9cyc_1L_1V_1I : SchedWriteRes<[A57UnitL, A57UnitV, A57UnitI]>;