1 //===-- PPCScheduleE500mc.td - e500mc Scheduling Defs ------*- tablegen -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines the itinerary class data for the Freescale e500mc 32-bit
13 // All information is derived from the "e500mc Core Reference Manual",
14 // Freescale Document Number E500MCRM, Rev. 1, 03/2012.
16 //===----------------------------------------------------------------------===//
17 // Relevant functional units in the Freescale e500mc core:
19 // * Decode & Dispatch
20 // Can dispatch up to 2 instructions per clock cycle to either the GPR Issue
21 // queues (GIQx), FP Issue Queue (FIQ), or Branch issue queue (BIQ).
22 def E500_DIS0 : FuncUnit; // Dispatch stage - insn 1
23 def E500_DIS1 : FuncUnit; // Dispatch stage - insn 2
26 // 6 pipelined execution units: SFX0, SFX1, BU, FPU, LSU, CFX.
27 // Some instructions can only execute in SFX0 but not SFX1.
28 // The CFX has a bypass path, allowing non-divide instructions to execute
29 // while a divide instruction is executed.
30 def E500_SFX0 : FuncUnit; // Simple unit 0
31 def E500_SFX1 : FuncUnit; // Simple unit 1
32 def E500_BU : FuncUnit; // Branch unit
33 def E500_CFX_DivBypass
34 : FuncUnit; // CFX divide bypass path
35 def E500_CFX_0 : FuncUnit; // CFX pipeline
36 def E500_LSU_0 : FuncUnit; // LSU pipeline
37 def E500_FPU_0 : FuncUnit; // FPU pipeline
39 def E500_GPR_Bypass : Bypass;
40 def E500_FPR_Bypass : Bypass;
41 def E500_CR_Bypass : Bypass;
43 def PPCE500mcItineraries : ProcessorItineraries<
44 [E500_DIS0, E500_DIS1, E500_SFX0, E500_SFX1, E500_BU, E500_CFX_DivBypass,
45 E500_CFX_0, E500_LSU_0, E500_FPU_0],
46 [E500_CR_Bypass, E500_GPR_Bypass, E500_FPR_Bypass], [
47 InstrItinData<IIC_IntSimple, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
48 InstrStage<1, [E500_SFX0, E500_SFX1]>],
49 [4, 1, 1], // Latency = 1
51 E500_GPR_Bypass, E500_GPR_Bypass]>,
52 InstrItinData<IIC_IntGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
53 InstrStage<1, [E500_SFX0, E500_SFX1]>],
54 [4, 1, 1], // Latency = 1
56 E500_GPR_Bypass, E500_GPR_Bypass]>,
57 InstrItinData<IIC_IntISEL, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
58 InstrStage<1, [E500_SFX0, E500_SFX1]>],
59 [4, 1, 1, 1], // Latency = 1
61 E500_GPR_Bypass, E500_GPR_Bypass,
63 InstrItinData<IIC_IntCompare, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
64 InstrStage<1, [E500_SFX0, E500_SFX1]>],
65 [5, 1, 1], // Latency = 1 or 2
67 E500_GPR_Bypass, E500_GPR_Bypass]>,
68 InstrItinData<IIC_IntDivW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
69 InstrStage<1, [E500_CFX_0], 0>,
70 InstrStage<14, [E500_CFX_DivBypass]>],
71 [17, 1, 1], // Latency=4..35, Repeat= 4..35
73 E500_GPR_Bypass, E500_GPR_Bypass]>,
74 InstrItinData<IIC_IntMFFS, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
75 InstrStage<8, [E500_FPU_0]>],
78 InstrItinData<IIC_IntMTFSB0, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
79 InstrStage<8, [E500_FPU_0]>],
80 [11, 1, 1], // Latency = 8
81 [NoBypass, NoBypass, NoBypass]>,
82 InstrItinData<IIC_IntMulHW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
83 InstrStage<1, [E500_CFX_0]>],
84 [7, 1, 1], // Latency = 4, Repeat rate = 1
86 E500_GPR_Bypass, E500_GPR_Bypass]>,
87 InstrItinData<IIC_IntMulHWU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
88 InstrStage<1, [E500_CFX_0]>],
89 [7, 1, 1], // Latency = 4, Repeat rate = 1
91 E500_GPR_Bypass, E500_GPR_Bypass]>,
92 InstrItinData<IIC_IntMulLI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
93 InstrStage<1, [E500_CFX_0]>],
94 [7, 1, 1], // Latency = 4, Repeat rate = 1
96 E500_GPR_Bypass, E500_GPR_Bypass]>,
97 InstrItinData<IIC_IntRotate, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
98 InstrStage<1, [E500_SFX0, E500_SFX1]>],
99 [4, 1, 1], // Latency = 1
101 E500_GPR_Bypass, E500_GPR_Bypass]>,
102 InstrItinData<IIC_IntShift, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
103 InstrStage<1, [E500_SFX0, E500_SFX1]>],
104 [4, 1, 1], // Latency = 1
106 E500_GPR_Bypass, E500_GPR_Bypass]>,
107 InstrItinData<IIC_IntTrapW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
108 InstrStage<2, [E500_SFX0]>],
109 [5, 1], // Latency = 2, Repeat rate = 2
110 [E500_GPR_Bypass, E500_GPR_Bypass]>,
111 InstrItinData<IIC_BrB, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
112 InstrStage<1, [E500_BU]>],
113 [4, 1], // Latency = 1
114 [NoBypass, E500_GPR_Bypass]>,
115 InstrItinData<IIC_BrCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
116 InstrStage<1, [E500_BU]>],
117 [4, 1, 1], // Latency = 1
119 E500_CR_Bypass, E500_CR_Bypass]>,
120 InstrItinData<IIC_BrMCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
121 InstrStage<1, [E500_BU]>],
122 [4, 1], // Latency = 1
123 [E500_CR_Bypass, E500_CR_Bypass]>,
124 InstrItinData<IIC_BrMCRX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
125 InstrStage<1, [E500_SFX0, E500_SFX1]>],
126 [4, 1, 1], // Latency = 1
127 [E500_CR_Bypass, E500_GPR_Bypass]>,
128 InstrItinData<IIC_LdStDCBA, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
129 InstrStage<1, [E500_LSU_0]>],
130 [6, 1], // Latency = 3, Repeat rate = 1
131 [E500_GPR_Bypass, E500_GPR_Bypass]>,
132 InstrItinData<IIC_LdStDCBF, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
133 InstrStage<1, [E500_LSU_0]>],
134 [6, 1], // Latency = 3
135 [E500_GPR_Bypass, E500_GPR_Bypass]>,
136 InstrItinData<IIC_LdStDCBI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
137 InstrStage<1, [E500_LSU_0]>],
138 [6, 1], // Latency = 3
139 [E500_GPR_Bypass, E500_GPR_Bypass]>,
140 InstrItinData<IIC_LdStLoad, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
141 InstrStage<1, [E500_LSU_0]>],
142 [6, 1], // Latency = 3
143 [E500_GPR_Bypass, E500_GPR_Bypass]>,
144 InstrItinData<IIC_LdStLoadUpd, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
145 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
146 InstrStage<1, [E500_LSU_0]>],
147 [6, 1], // Latency = 3
148 [E500_GPR_Bypass, E500_GPR_Bypass],
150 InstrItinData<IIC_LdStLoadUpdX,[InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
151 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
152 InstrStage<1, [E500_LSU_0]>],
153 [6, 1], // Latency = 3
154 [E500_GPR_Bypass, E500_GPR_Bypass],
156 InstrItinData<IIC_LdStStore, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
157 InstrStage<1, [E500_LSU_0]>],
158 [6, 1], // Latency = 3
159 [NoBypass, E500_GPR_Bypass]>,
160 InstrItinData<IIC_LdStStoreUpd,[InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
161 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
162 InstrStage<1, [E500_LSU_0]>],
163 [6, 1], // Latency = 3
164 [NoBypass, E500_GPR_Bypass],
166 InstrItinData<IIC_LdStICBI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
167 InstrStage<1, [E500_LSU_0]>],
168 [6, 1], // Latency = 3
169 [NoBypass, E500_GPR_Bypass]>,
170 InstrItinData<IIC_LdStSTFD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
171 InstrStage<1, [E500_LSU_0]>],
172 [6, 1, 1], // Latency = 3
174 E500_GPR_Bypass, E500_GPR_Bypass]>,
175 InstrItinData<IIC_LdStSTFDU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
176 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
177 InstrStage<1, [E500_LSU_0]>],
178 [6, 1, 1], // Latency = 3
180 E500_GPR_Bypass, E500_GPR_Bypass],
182 InstrItinData<IIC_LdStLFD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
183 InstrStage<1, [E500_LSU_0]>],
184 [7, 1, 1], // Latency = 4
186 E500_GPR_Bypass, E500_GPR_Bypass]>,
187 InstrItinData<IIC_LdStLFDU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
188 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
189 InstrStage<1, [E500_LSU_0]>],
190 [7, 1, 1], // Latency = 4
192 E500_GPR_Bypass, E500_GPR_Bypass],
194 InstrItinData<IIC_LdStLFDUX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
195 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
196 InstrStage<1, [E500_LSU_0]>],
197 [7, 1, 1], // Latency = 4
199 E500_GPR_Bypass, E500_GPR_Bypass],
201 InstrItinData<IIC_LdStLHA, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
202 InstrStage<1, [E500_LSU_0]>],
203 [6, 1], // Latency = 3
204 [E500_GPR_Bypass, E500_GPR_Bypass]>,
205 InstrItinData<IIC_LdStLHAU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
206 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
207 InstrStage<1, [E500_LSU_0]>],
208 [6, 1], // Latency = 3
209 [E500_GPR_Bypass, E500_GPR_Bypass]>,
210 InstrItinData<IIC_LdStLHAUX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
211 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
212 InstrStage<1, [E500_LSU_0]>],
213 [6, 1], // Latency = 3
214 [E500_GPR_Bypass, E500_GPR_Bypass]>,
215 InstrItinData<IIC_LdStLMW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
216 InstrStage<1, [E500_LSU_0]>],
217 [7, 1], // Latency = r+3
218 [NoBypass, E500_GPR_Bypass]>,
219 InstrItinData<IIC_LdStLWARX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
220 InstrStage<3, [E500_LSU_0]>],
221 [6, 1, 1], // Latency = 3, Repeat rate = 3
223 E500_GPR_Bypass, E500_GPR_Bypass]>,
224 InstrItinData<IIC_LdStSTWCX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
225 InstrStage<1, [E500_LSU_0]>],
226 [6, 1], // Latency = 3
227 [NoBypass, E500_GPR_Bypass]>,
228 InstrItinData<IIC_LdStSync, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
229 InstrStage<1, [E500_LSU_0]>]>,
230 InstrItinData<IIC_SprMFSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
231 InstrStage<4, [E500_SFX0]>],
233 [E500_GPR_Bypass, E500_GPR_Bypass]>,
234 InstrItinData<IIC_SprMTMSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
235 InstrStage<2, [E500_SFX0, E500_SFX1]>],
236 [5, 1], // Latency = 2, Repeat rate = 4
237 [E500_GPR_Bypass, E500_GPR_Bypass]>,
238 InstrItinData<IIC_SprMTSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
239 InstrStage<1, [E500_SFX0]>],
241 [NoBypass, E500_GPR_Bypass]>,
242 InstrItinData<IIC_SprTLBSYNC, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
243 InstrStage<1, [E500_LSU_0], 0>]>,
244 InstrItinData<IIC_SprMFCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
245 InstrStage<5, [E500_SFX0]>],
247 [E500_GPR_Bypass, E500_CR_Bypass]>,
248 InstrItinData<IIC_SprMFCRF, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
249 InstrStage<5, [E500_SFX0]>],
251 [E500_GPR_Bypass, E500_CR_Bypass]>,
252 InstrItinData<IIC_SprMFPMR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
253 InstrStage<4, [E500_SFX0]>],
254 [7, 1], // Latency = 4, Repeat rate = 4
255 [E500_GPR_Bypass, E500_GPR_Bypass]>,
256 InstrItinData<IIC_SprMFMSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
257 InstrStage<4, [E500_SFX0]>],
258 [7, 1], // Latency = 4, Repeat rate = 4
259 [E500_GPR_Bypass, E500_GPR_Bypass]>,
260 InstrItinData<IIC_SprMFSPR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
261 InstrStage<1, [E500_SFX0, E500_SFX1]>],
262 [4, 1], // Latency = 1, Repeat rate = 1
263 [E500_GPR_Bypass, E500_CR_Bypass]>,
264 InstrItinData<IIC_SprMTPMR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
265 InstrStage<1, [E500_SFX0]>],
266 [4, 1], // Latency = 1, Repeat rate = 1
267 [E500_CR_Bypass, E500_GPR_Bypass]>,
268 InstrItinData<IIC_SprMFTB, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
269 InstrStage<4, [E500_SFX0]>],
270 [7, 1], // Latency = 4, Repeat rate = 4
271 [NoBypass, E500_GPR_Bypass]>,
272 InstrItinData<IIC_SprMTSPR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
273 InstrStage<1, [E500_SFX0, E500_SFX1]>],
274 [4, 1], // Latency = 1, Repeat rate = 1
275 [E500_CR_Bypass, E500_GPR_Bypass]>,
276 InstrItinData<IIC_SprMTSRIN, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
277 InstrStage<1, [E500_SFX0]>],
279 [NoBypass, E500_GPR_Bypass]>,
280 InstrItinData<IIC_FPGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
281 InstrStage<2, [E500_FPU_0]>],
282 [11, 1, 1], // Latency = 8, Repeat rate = 2
284 E500_FPR_Bypass, E500_FPR_Bypass]>,
285 InstrItinData<IIC_FPAddSub, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
286 InstrStage<4, [E500_FPU_0]>],
287 [13, 1, 1], // Latency = 10, Repeat rate = 4
289 E500_FPR_Bypass, E500_FPR_Bypass]>,
290 InstrItinData<IIC_FPCompare, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
291 InstrStage<2, [E500_FPU_0]>],
292 [11, 1, 1], // Latency = 8, Repeat rate = 2
294 E500_FPR_Bypass, E500_FPR_Bypass]>,
295 InstrItinData<IIC_FPDivD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
296 InstrStage<68, [E500_FPU_0]>],
297 [71, 1, 1], // Latency = 68, Repeat rate = 68
299 E500_FPR_Bypass, E500_FPR_Bypass]>,
300 InstrItinData<IIC_FPDivS, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
301 InstrStage<38, [E500_FPU_0]>],
302 [41, 1, 1], // Latency = 38, Repeat rate = 38
304 E500_FPR_Bypass, E500_FPR_Bypass]>,
305 InstrItinData<IIC_FPFused, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
306 InstrStage<4, [E500_FPU_0]>],
307 [13, 1, 1, 1], // Latency = 10, Repeat rate = 4
309 E500_FPR_Bypass, E500_FPR_Bypass,
311 InstrItinData<IIC_FPRes, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
312 InstrStage<38, [E500_FPU_0]>],
313 [41, 1], // Latency = 38, Repeat rate = 38
314 [E500_FPR_Bypass, E500_FPR_Bypass]>
317 // ===---------------------------------------------------------------------===//
318 // e500mc machine model for scheduling and other instruction cost heuristics.
320 def PPCE500mcModel : SchedMachineModel {
321 let IssueWidth = 2; // 2 micro-ops are dispatched per cycle.
322 let LoadLatency = 5; // Optimistic load latency assuming bypass.
323 // This is overriden by OperandCycles if the
324 // Itineraries are queried instead.
326 let CompleteModel = 0;
328 let Itineraries = PPCE500mcItineraries;