Add gfx950 mfma instructions to ROCDL dialect (#123361)
[llvm-project.git] / llvm / lib / Target / X86 / X86ScheduleAtom.td
blobc92bc97cfb385a0d621fe459e9d94fb7562a9995
1 //===- X86ScheduleAtom.td - X86 Atom Scheduling Definitions -*- tablegen -*-==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file defines the schedule class data for the Intel Atom
10 // in order (Saltwell-32nm/Bonnell-45nm) processors.
12 //===----------------------------------------------------------------------===//
15 // Scheduling information derived from the "Intel 64 and IA32 Architectures
16 // Optimization Reference Manual", Chapter 13, Section 4.
18 // Atom machine model.
19 def AtomModel : SchedMachineModel {
20   let IssueWidth = 2;  // Allows 2 instructions per scheduling group.
21   let MicroOpBufferSize = 0; // In-order execution, always hide latency.
22   let LoadLatency = 3; // Expected cycles, may be overriden.
23   let HighLatency = 30;// Expected, may be overriden.
25   // On the Atom, the throughput for taken branches is 2 cycles. For small
26   // simple loops, expand by a small factor to hide the backedge cost.
27   let LoopMicroOpBufferSize = 10;
28   let PostRAScheduler = 1;
29   let CompleteModel = 0;
32 let SchedModel = AtomModel in {
34 // Functional Units
35 def AtomPort0 : ProcResource<1>; // ALU: ALU0, shift/rotate, load/store
36                                  // SIMD/FP: SIMD ALU, Shuffle,SIMD/FP multiply, divide
37 def AtomPort1 : ProcResource<1>; // ALU: ALU1, bit processing, jump, and LEA
38                                  // SIMD/FP: SIMD ALU, FP Adder
40 // NOTE: This is for ops that can use EITHER port, not for ops that require BOTH ports.
41 def AtomPort01 : ProcResGroup<[AtomPort0, AtomPort1]>;
43 // Loads are 3 cycles, so ReadAfterLd registers needn't be available until 3
44 // cycles after the memory operand.
45 def : ReadAdvance<ReadAfterLd, 3>;
46 def : ReadAdvance<ReadAfterVecLd, 3>;
47 def : ReadAdvance<ReadAfterVecXLd, 3>;
48 def : ReadAdvance<ReadAfterVecYLd, 3>;
50 def : ReadAdvance<ReadInt2Fpu, 0>;
52 // This multiclass defines the resource usage for variants with and without
53 // folded loads.
54 multiclass AtomWriteResPair<X86FoldableSchedWrite SchedRW,
55                             list<ProcResourceKind> RRPorts,
56                             list<ProcResourceKind> RMPorts,
57                             int RRLat = 1, int RMLat = 1,
58                             list<int> RRRes = [1],
59                             list<int> RMRes = [1],
60                             int RRUOps = 1,
61                             int RMUOps = 1> {
62   // Register variant.
63   def : WriteRes<SchedRW, RRPorts> {
64     let Latency = RRLat;
65     let ReleaseAtCycles = RRRes;
66     let NumMicroOps = RRUOps;
67   }
69   // Memory variant.
70   def : WriteRes<SchedRW.Folded, RMPorts> {
71     let Latency = RMLat;
72     let ReleaseAtCycles = RMRes;
73     let NumMicroOps = RMUOps;
74   }
77 // A folded store needs a cycle on Port0 for the store data.
78 def : WriteRes<WriteRMW, [AtomPort0]>;
80 ////////////////////////////////////////////////////////////////////////////////
81 // Arithmetic.
82 ////////////////////////////////////////////////////////////////////////////////
84 defm : AtomWriteResPair<WriteALU,    [AtomPort01], [AtomPort0]>;
85 defm : AtomWriteResPair<WriteADC,    [AtomPort01], [AtomPort0]>;
87 defm : AtomWriteResPair<WriteIMul8,     [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  7,  7,  [7,7],  [7,7], 3, 3>;
88 defm : AtomWriteResPair<WriteIMul16,    [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  7,  8,  [7,7],  [8,8], 4, 5>;
89 defm : AtomWriteResPair<WriteIMul16Imm, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 2, 3>;
90 defm : AtomWriteResPair<WriteIMul16Reg, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 2, 3>;
91 defm : AtomWriteResPair<WriteIMul32,    [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 3, 4>;
92 defm : AtomWriteResPair<WriteIMul32Imm, [AtomPort0],  [AtomPort0],   5,  5,  [5],  [5]>;
93 defm : AtomWriteResPair<WriteIMul32Reg, [AtomPort0],  [AtomPort0],   5,  5,  [5],  [5]>;
94 defm : AtomWriteResPair<WriteIMul64,    [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 12, 12, [12,12], [12,12], 8, 8>;
95 defm : AtomWriteResPair<WriteIMul64Imm, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 14, 14, [14,14], [14,14], 7, 7>;
96 defm : AtomWriteResPair<WriteIMul64Reg, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 12, 12, [12,12], [12,12], 6, 6>;
97 defm : X86WriteResUnsupported<WriteIMulH>;
98 defm : X86WriteResUnsupported<WriteIMulHLd>;
99 defm : X86WriteResPairUnsupported<WriteMULX32>;
100 defm : X86WriteResPairUnsupported<WriteMULX64>;
102 defm : X86WriteRes<WriteXCHG,        [AtomPort01], 2, [2], 1>;
103 defm : X86WriteRes<WriteBSWAP32,     [AtomPort0], 1, [1], 1>;
104 defm : X86WriteRes<WriteBSWAP64,     [AtomPort0], 1, [1], 1>;
105 defm : AtomWriteResPair<WriteCMPXCHG, [AtomPort01], [AtomPort01], 15, 15, [15]>;
106 defm : X86WriteRes<WriteCMPXCHGRMW,   [AtomPort01, AtomPort0], 1, [1, 1], 1>;
108 defm : AtomWriteResPair<WriteDiv8,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 50, 68, [50,50], [68,68],  9,  9>;
109 defm : AtomWriteResPair<WriteDiv16,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 50, 50, [50,50], [50,50], 12, 12>;
110 defm : AtomWriteResPair<WriteDiv32,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 50, 50, [50,50], [50,50], 12, 12>;
111 defm : AtomWriteResPair<WriteDiv64,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],130,130,[130,130],[130,130], 38, 38>;
112 defm : AtomWriteResPair<WriteIDiv8,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 62, 62, [62,62], [62,62], 26, 26>;
113 defm : AtomWriteResPair<WriteIDiv16, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 62, 62, [62,62], [62,62], 29, 29>;
114 defm : AtomWriteResPair<WriteIDiv32, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 62, 62, [62,62], [62,62], 29, 29>;
115 defm : AtomWriteResPair<WriteIDiv64, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],130,130,[130,130],[130,130], 60, 60>;
117 defm : X86WriteResPairUnsupported<WriteCRC32>;
119 defm : AtomWriteResPair<WriteCMOV,  [AtomPort01], [AtomPort0]>;
120 defm : X86WriteRes<WriteFCMOV, [AtomPort01], 9, [9], 1>; // x87 conditional move.
122 def  : WriteRes<WriteSETCC, [AtomPort01]>;
123 def  : WriteRes<WriteSETCCStore, [AtomPort01]> {
124   let Latency = 2;
125   let ReleaseAtCycles = [2];
127 def  : WriteRes<WriteLAHFSAHF, [AtomPort01]> {
128   let Latency = 2;
129   let ReleaseAtCycles = [2];
131 defm : X86WriteRes<WriteBitTest,         [AtomPort1],  1, [1], 1>;
132 defm : X86WriteRes<WriteBitTestImmLd,    [AtomPort0],  1, [1], 1>;
133 defm : X86WriteRes<WriteBitTestRegLd,    [AtomPort01], 9, [9], 1>;
134 defm : X86WriteRes<WriteBitTestSet,      [AtomPort1],  1, [1], 1>;
135 //defm : X86WriteRes<WriteBitTestSetImmLd, [AtomPort1],  1, [1], 1>;
136 //defm : X86WriteRes<WriteBitTestSetRegLd, [AtomPort1],  1, [1], 1>;
138 // This is for simple LEAs with one or two input operands.
139 def : WriteRes<WriteLEA, [AtomPort1]>;
141 // Bit counts.
142 defm : AtomWriteResPair<WriteBSF, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 16, 16, [16,16], [16,16], 10, 10>;
143 defm : AtomWriteResPair<WriteBSR, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 16, 16, [16,16], [16,16], 10, 10>;
144 defm : X86WriteResPairUnsupported<WritePOPCNT>;
145 defm : X86WriteResPairUnsupported<WriteLZCNT>;
146 defm : X86WriteResPairUnsupported<WriteTZCNT>;
148 // BMI1 BEXTR/BLS, BMI2 BZHI
149 defm : X86WriteResPairUnsupported<WriteBEXTR>;
150 defm : X86WriteResPairUnsupported<WriteBLS>;
151 defm : X86WriteResPairUnsupported<WriteBZHI>;
153 ////////////////////////////////////////////////////////////////////////////////
154 // Integer shifts and rotates.
155 ////////////////////////////////////////////////////////////////////////////////
157 defm : AtomWriteResPair<WriteShift,    [AtomPort0], [AtomPort0]>;
158 defm : AtomWriteResPair<WriteShiftCL,  [AtomPort0], [AtomPort0]>;
159 defm : AtomWriteResPair<WriteRotate,   [AtomPort0], [AtomPort0]>;
160 defm : AtomWriteResPair<WriteRotateCL, [AtomPort0], [AtomPort0]>;
162 defm : X86WriteRes<WriteSHDrri, [AtomPort01], 2, [2], 1>;
163 defm : X86WriteRes<WriteSHDrrcl,[AtomPort01], 2, [2], 1>;
164 defm : X86WriteRes<WriteSHDmri, [AtomPort01], 4, [4], 1>;
165 defm : X86WriteRes<WriteSHDmrcl,[AtomPort01], 4, [4], 1>;
167 ////////////////////////////////////////////////////////////////////////////////
168 // Loads, stores, and moves, not folded with other operations.
169 ////////////////////////////////////////////////////////////////////////////////
171 def : WriteRes<WriteLoad,    [AtomPort0]>;
172 def : WriteRes<WriteStore,   [AtomPort0]>;
173 def : WriteRes<WriteStoreNT, [AtomPort0]>;
174 def : WriteRes<WriteMove,    [AtomPort01]>;
175 defm : X86WriteResUnsupported<WriteVecMaskedGatherWriteback>;
177 // Treat misc copies as a move.
178 def : InstRW<[WriteMove], (instrs COPY)>;
180 ////////////////////////////////////////////////////////////////////////////////
181 // Idioms that clear a register, like xorps %xmm0, %xmm0.
182 // These can often bypass execution ports completely.
183 ////////////////////////////////////////////////////////////////////////////////
185 def : WriteRes<WriteZero,  []>;
187 ////////////////////////////////////////////////////////////////////////////////
188 // Branches don't produce values, so they have no latency, but they still
189 // consume resources. Indirect branches can fold loads.
190 ////////////////////////////////////////////////////////////////////////////////
192 defm : AtomWriteResPair<WriteJump, [AtomPort1], [AtomPort1]>;
194 ////////////////////////////////////////////////////////////////////////////////
195 // Special case scheduling classes.
196 ////////////////////////////////////////////////////////////////////////////////
198 def : WriteRes<WriteSystem,     [AtomPort01]> { let Latency = 100; }
199 def : WriteRes<WriteMicrocoded, [AtomPort01]> { let Latency = 100; }
200 def : WriteRes<WriteFence,      [AtomPort0]>;
202 // Nops don't have dependencies, so there's no actual latency, but we set this
203 // to '1' to tell the scheduler that the nop uses an ALU slot for a cycle.
204 def : WriteRes<WriteNop, [AtomPort01]>;
206 ////////////////////////////////////////////////////////////////////////////////
207 // Floating point. This covers both scalar and vector operations.
208 ////////////////////////////////////////////////////////////////////////////////
210 defm : X86WriteRes<WriteFLD0,       [AtomPort01], 1, [1], 1>;
211 defm : X86WriteRes<WriteFLD1,       [AtomPort01], 6, [6], 1>;
212 def  : WriteRes<WriteFLoad,         [AtomPort0]>;
213 def  : WriteRes<WriteFLoadX,        [AtomPort0]>;
214 defm : X86WriteResUnsupported<WriteFLoadY>;
215 defm : X86WriteResUnsupported<WriteFMaskedLoad>;
216 defm : X86WriteResUnsupported<WriteFMaskedLoadY>;
218 def  : WriteRes<WriteFStore,        [AtomPort0]>;
219 def  : WriteRes<WriteFStoreX,       [AtomPort0]>;
220 defm : X86WriteResUnsupported<WriteFStoreY>;
221 def  : WriteRes<WriteFStoreNT,      [AtomPort0]>;
222 def  : WriteRes<WriteFStoreNTX,     [AtomPort0]>;
223 defm : X86WriteResUnsupported<WriteFStoreNTY>;
224 defm : X86WriteResUnsupported<WriteFMaskedStore32>;
225 defm : X86WriteResUnsupported<WriteFMaskedStore32Y>;
226 defm : X86WriteResUnsupported<WriteFMaskedStore64>;
227 defm : X86WriteResUnsupported<WriteFMaskedStore64Y>;
229 def  : WriteRes<WriteFMove,         [AtomPort01]>;
230 def  : WriteRes<WriteFMoveX,        [AtomPort01]>;
231 defm : X86WriteResUnsupported<WriteFMoveY>;
232 defm : X86WriteResUnsupported<WriteFMoveZ>;
234 defm : X86WriteRes<WriteEMMS,       [AtomPort01], 5, [5], 1>;
236 defm : AtomWriteResPair<WriteFAdd,           [AtomPort1], [AtomPort0,AtomPort1],  5,  5,  [1],  [1,1]>;
237 defm : AtomWriteResPair<WriteFAddX,          [AtomPort1], [AtomPort0,AtomPort1],  5,  5,  [1],  [1,1]>;
238 defm : X86WriteResPairUnsupported<WriteFAddY>;
239 defm : X86WriteResPairUnsupported<WriteFAddZ>;
240 defm : AtomWriteResPair<WriteFAdd64,         [AtomPort1], [AtomPort0,AtomPort1],  5,  5,  [1],  [1,1]>;
241 defm : AtomWriteResPair<WriteFAdd64X,        [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [5,5],  [6,6], 3, 4>;
242 defm : X86WriteResPairUnsupported<WriteFAdd64Y>;
243 defm : X86WriteResPairUnsupported<WriteFAdd64Z>;
244 defm : AtomWriteResPair<WriteFCmp,           [AtomPort1], [AtomPort0,AtomPort1],  5,  5,  [1],  [1,1]>;
245 defm : AtomWriteResPair<WriteFCmpX,          [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [5,5],  [6,6], 3, 4>;
246 defm : X86WriteResPairUnsupported<WriteFCmpY>;
247 defm : X86WriteResPairUnsupported<WriteFCmpZ>;
248 defm : AtomWriteResPair<WriteFCmp64,         [AtomPort1], [AtomPort0,AtomPort1],  5,  5,  [1],  [1,1]>;
249 defm : AtomWriteResPair<WriteFCmp64X,        [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [5,5],  [6,6], 3, 4>;
250 defm : X86WriteResPairUnsupported<WriteFCmp64Y>;
251 defm : X86WriteResPairUnsupported<WriteFCmp64Z>;
252 defm : AtomWriteResPair<WriteFCom,           [AtomPort0],  [AtomPort0],  5,  5,  [5],  [5]>;
253 defm : AtomWriteResPair<WriteFComX,          [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  9, 10,  [9,9],[10,10], 4, 5>;
254 defm : AtomWriteResPair<WriteFMul,           [AtomPort0],  [AtomPort0],  4,  4,  [2],  [2]>;
255 defm : AtomWriteResPair<WriteFMulX,          [AtomPort0],  [AtomPort0],  5,  5,  [2],  [2]>;
256 defm : X86WriteResPairUnsupported<WriteFMulY>;
257 defm : X86WriteResPairUnsupported<WriteFMulZ>;
258 defm : AtomWriteResPair<WriteFMul64,         [AtomPort0],  [AtomPort0],  5,  5,  [2],  [2]>;
259 defm : AtomWriteResPair<WriteFMul64X,        [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  9, 10,  [9,9],[10,10], 6, 7>;
260 defm : X86WriteResPairUnsupported<WriteFMul64Y>;
261 defm : X86WriteResPairUnsupported<WriteFMul64Z>;
262 defm : AtomWriteResPair<WriteFRcp,           [AtomPort0],  [AtomPort0],  4,  4,  [4],  [4]>;
263 defm : AtomWriteResPair<WriteFRcpX,          [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  9, 10,  [9,9], [10,10], 5, 6>;
264 defm : X86WriteResPairUnsupported<WriteFRcpY>;
265 defm : X86WriteResPairUnsupported<WriteFRcpZ>;
266 defm : AtomWriteResPair<WriteFRsqrt,         [AtomPort0],  [AtomPort0],  4,  4,  [4],  [4]>;
267 defm : AtomWriteResPair<WriteFRsqrtX,        [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  9, 10,  [9,9], [10,10], 5, 6>;
268 defm : X86WriteResPairUnsupported<WriteFRsqrtY>;
269 defm : X86WriteResPairUnsupported<WriteFRsqrtZ>;
270 defm : AtomWriteResPair<WriteFDiv,          [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 34, 34, [34,34], [34,34], 3, 4>;
271 defm : AtomWriteResPair<WriteFDivX,         [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 70, 70, [70,70], [70,70], 6, 7>;
272 defm : X86WriteResPairUnsupported<WriteFDivY>;
273 defm : X86WriteResPairUnsupported<WriteFDivZ>;
274 defm : AtomWriteResPair<WriteFDiv64,        [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 62, 62,  [62,62],  [62,62], 3, 4>;
275 defm : AtomWriteResPair<WriteFDiv64X,       [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],125,125,[125,125],[125,125], 6, 7>;
276 defm : X86WriteResPairUnsupported<WriteFDiv64Y>;
277 defm : X86WriteResPairUnsupported<WriteFDiv64Z>;
278 defm : AtomWriteResPair<WriteFSqrt,         [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 34, 34, [34,34], [34,34], 3, 4>;
279 defm : AtomWriteResPair<WriteFSqrtX,        [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 70, 70, [70,70], [70,70], 5, 6>;
280 defm : X86WriteResPairUnsupported<WriteFSqrtY>;
281 defm : X86WriteResPairUnsupported<WriteFSqrtZ>;
282 defm : AtomWriteResPair<WriteFSqrt64,       [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 62, 62,  [62,62],  [62,62], 3, 4>;
283 defm : AtomWriteResPair<WriteFSqrt64X,      [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],125,125,[125,125],[125,125], 5, 6>;
284 defm : X86WriteResPairUnsupported<WriteFSqrt64Y>;
285 defm : X86WriteResPairUnsupported<WriteFSqrt64Z>;
286 defm : AtomWriteResPair<WriteFSqrt80,        [AtomPort0],  [AtomPort0], 71, 71, [71], [71]>;
287 defm : AtomWriteResPair<WriteFSign,          [AtomPort1],  [AtomPort1]>;
288 defm : AtomWriteResPair<WriteFRnd,           [AtomPort0],  [AtomPort0],  5,  5,  [5],  [5]>;
289 defm : X86WriteResPairUnsupported<WriteFRndY>;
290 defm : X86WriteResPairUnsupported<WriteFRndZ>;
291 defm : AtomWriteResPair<WriteFLogic,        [AtomPort01],  [AtomPort0]>;
292 defm : X86WriteResPairUnsupported<WriteFLogicY>;
293 defm : X86WriteResPairUnsupported<WriteFLogicZ>;
294 defm : AtomWriteResPair<WriteFTest,         [AtomPort01],  [AtomPort0]>;
295 defm : X86WriteResPairUnsupported<WriteFTestY>;
296 defm : X86WriteResPairUnsupported<WriteFTestZ>;
297 defm : AtomWriteResPair<WriteFShuffle,       [AtomPort0],  [AtomPort0]>;
298 defm : X86WriteResPairUnsupported<WriteFShuffleY>;
299 defm : X86WriteResPairUnsupported<WriteFShuffleZ>;
300 defm : X86WriteResPairUnsupported<WriteFVarShuffle>;
301 defm : X86WriteResPairUnsupported<WriteFVarShuffleY>;
302 defm : X86WriteResPairUnsupported<WriteFVarShuffleZ>;
303 defm : X86WriteResPairUnsupported<WriteFMA>;
304 defm : X86WriteResPairUnsupported<WriteFMAX>;
305 defm : X86WriteResPairUnsupported<WriteFMAY>;
306 defm : X86WriteResPairUnsupported<WriteFMAZ>;
307 defm : X86WriteResPairUnsupported<WriteDPPD>;
308 defm : X86WriteResPairUnsupported<WriteDPPS>;
309 defm : X86WriteResPairUnsupported<WriteDPPSY>;
310 defm : X86WriteResPairUnsupported<WriteFBlend>;
311 defm : X86WriteResPairUnsupported<WriteFBlendY>;
312 defm : X86WriteResPairUnsupported<WriteFBlendZ>;
313 defm : X86WriteResPairUnsupported<WriteFVarBlend>;
314 defm : X86WriteResPairUnsupported<WriteFVarBlendY>;
315 defm : X86WriteResPairUnsupported<WriteFVarBlendZ>;
316 defm : X86WriteResPairUnsupported<WriteFShuffle256>;
317 defm : X86WriteResPairUnsupported<WriteFVarShuffle256>;
319 ////////////////////////////////////////////////////////////////////////////////
320 // Conversions.
321 ////////////////////////////////////////////////////////////////////////////////
323 defm : AtomWriteResPair<WriteCvtSS2I,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  8,  9,  [8,8],  [9,9], 3, 4>;
324 defm : AtomWriteResPair<WriteCvtPS2I,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 3, 4>;
325 defm : X86WriteResPairUnsupported<WriteCvtPS2IY>;
326 defm : X86WriteResPairUnsupported<WriteCvtPS2IZ>;
327 defm : AtomWriteResPair<WriteCvtSD2I,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  8,  9,  [8,8],[10,10], 3, 4>;
328 defm : AtomWriteResPair<WriteCvtPD2I,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  7,  8,  [7,7],  [8,8], 4, 5>;
329 defm : X86WriteResPairUnsupported<WriteCvtPD2IY>;
330 defm : X86WriteResPairUnsupported<WriteCvtPD2IZ>;
332 defm : AtomWriteResPair<WriteCvtI2SS,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [6,6], 3, 1>;
333 defm : AtomWriteResPair<WriteCvtI2PS,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 3, 4>;
334 defm : X86WriteResPairUnsupported<WriteCvtI2PSY>;
335 defm : X86WriteResPairUnsupported<WriteCvtI2PSZ>;
336 defm : AtomWriteResPair<WriteCvtI2SD,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 3, 3>;
337 defm : AtomWriteResPair<WriteCvtI2PD,   [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  7,  8,  [6,6],  [7,7], 3, 4>;
338 defm : X86WriteResPairUnsupported<WriteCvtI2PDY>;
339 defm : X86WriteResPairUnsupported<WriteCvtI2PDZ>;
341 defm : AtomWriteResPair<WriteCvtSS2SD,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  6,  7,  [6,6],  [7,7], 3, 4>;
342 defm : AtomWriteResPair<WriteCvtPS2PD,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1],  7,  8,  [6,6],  [7,7], 4, 5>;
343 defm : X86WriteResPairUnsupported<WriteCvtPS2PDY>;
344 defm : X86WriteResPairUnsupported<WriteCvtPS2PDZ>;
345 defm : AtomWriteResPair<WriteCvtSD2SS,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 10, 11,[10,10],[12,12], 3, 4>;
346 defm : AtomWriteResPair<WriteCvtPD2PS,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 11, 12,[11,11],[12,12], 4, 5>;
347 defm : X86WriteResPairUnsupported<WriteCvtPD2PSY>;
348 defm : X86WriteResPairUnsupported<WriteCvtPD2PSZ>;
350 defm : X86WriteResPairUnsupported<WriteCvtPH2PS>;
351 defm : X86WriteResPairUnsupported<WriteCvtPH2PSY>;
352 defm : X86WriteResPairUnsupported<WriteCvtPH2PSZ>;
353 defm : X86WriteResUnsupported<WriteCvtPS2PH>;
354 defm : X86WriteResUnsupported<WriteCvtPS2PHSt>;
355 defm : X86WriteResUnsupported<WriteCvtPS2PHY>;
356 defm : X86WriteResUnsupported<WriteCvtPS2PHZ>;
357 defm : X86WriteResUnsupported<WriteCvtPS2PHYSt>;
358 defm : X86WriteResUnsupported<WriteCvtPS2PHZSt>;
360 ////////////////////////////////////////////////////////////////////////////////
361 // Vector integer operations.
362 ////////////////////////////////////////////////////////////////////////////////
364 def  : WriteRes<WriteVecLoad,         [AtomPort0]>;
365 def  : WriteRes<WriteVecLoadX,        [AtomPort0]>;
366 defm : X86WriteResUnsupported<WriteVecLoadY>;
367 def  : WriteRes<WriteVecLoadNT,       [AtomPort0]>;
368 defm : X86WriteResUnsupported<WriteVecLoadNTY>;
369 defm : X86WriteResUnsupported<WriteVecMaskedLoad>;
370 defm : X86WriteResUnsupported<WriteVecMaskedLoadY>;
372 def  : WriteRes<WriteVecStore,        [AtomPort0]>;
373 def  : WriteRes<WriteVecStoreX,       [AtomPort0]>;
374 defm : X86WriteResUnsupported<WriteVecStoreY>;
375 def  : WriteRes<WriteVecStoreNT,      [AtomPort0]>;
376 defm : X86WriteResUnsupported<WriteVecStoreNTY>;
377 defm : X86WriteResUnsupported<WriteVecMaskedStore32>;
378 defm : X86WriteResUnsupported<WriteVecMaskedStore64>;
379 defm : X86WriteResUnsupported<WriteVecMaskedStore32Y>;
380 defm : X86WriteResUnsupported<WriteVecMaskedStore64Y>;
382 def  : WriteRes<WriteVecMove,          [AtomPort0]>;
383 def  : WriteRes<WriteVecMoveX,        [AtomPort01]>;
384 defm : X86WriteResUnsupported<WriteVecMoveY>;
385 defm : X86WriteResUnsupported<WriteVecMoveZ>;
386 defm : X86WriteRes<WriteVecMoveToGpr,   [AtomPort0], 3, [3], 1>;
387 defm : X86WriteRes<WriteVecMoveFromGpr, [AtomPort0], 1, [1], 1>;
389 defm : AtomWriteResPair<WriteVecALU,       [AtomPort01],  [AtomPort0], 1, 1>;
390 defm : AtomWriteResPair<WriteVecALUX,      [AtomPort01],  [AtomPort0], 1, 1>;
391 defm : X86WriteResPairUnsupported<WriteVecALUY>;
392 defm : X86WriteResPairUnsupported<WriteVecALUZ>;
393 defm : AtomWriteResPair<WriteVecLogic,     [AtomPort01],  [AtomPort0], 1, 1>;
394 defm : AtomWriteResPair<WriteVecLogicX,    [AtomPort01],  [AtomPort0], 1, 1>;
395 defm : X86WriteResPairUnsupported<WriteVecLogicY>;
396 defm : X86WriteResPairUnsupported<WriteVecLogicZ>;
397 defm : X86WriteResPairUnsupported<WriteVecTest>;
398 defm : X86WriteResPairUnsupported<WriteVecTestY>;
399 defm : X86WriteResPairUnsupported<WriteVecTestZ>;
400 defm : AtomWriteResPair<WriteVecShift,     [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 2, 3, [1,1], [2,2], 2, 3>;
401 defm : AtomWriteResPair<WriteVecShiftX,    [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 2, 3, [1,1], [2,2], 2, 3>;
402 defm : X86WriteResPairUnsupported<WriteVecShiftY>;
403 defm : X86WriteResPairUnsupported<WriteVecShiftZ>;
404 defm : AtomWriteResPair<WriteVecShiftImm,   [AtomPort0],  [AtomPort0], 1, 1>;
405 defm : AtomWriteResPair<WriteVecShiftImmX,  [AtomPort0],  [AtomPort0], 1, 1>;
406 defm : X86WriteResPairUnsupported<WriteVecShiftImmY>;
407 defm : X86WriteResPairUnsupported<WriteVecShiftImmZ>;
408 defm : AtomWriteResPair<WriteVecIMul,       [AtomPort0],  [AtomPort0], 4, 4, [1], [1]>;
409 defm : AtomWriteResPair<WriteVecIMulX,      [AtomPort0],  [AtomPort0], 5, 5, [2], [2]>;
410 defm : X86WriteResPairUnsupported<WriteVecIMulY>;
411 defm : X86WriteResPairUnsupported<WriteVecIMulZ>;
412 defm : X86WriteResPairUnsupported<WritePMULLD>;
413 defm : X86WriteResPairUnsupported<WritePMULLDY>;
414 defm : X86WriteResPairUnsupported<WritePMULLDZ>;
415 defm : X86WriteResPairUnsupported<WritePHMINPOS>;
416 defm : X86WriteResPairUnsupported<WriteMPSAD>;
417 defm : X86WriteResPairUnsupported<WriteMPSADY>;
418 defm : X86WriteResPairUnsupported<WriteMPSADZ>;
419 defm : AtomWriteResPair<WritePSADBW,        [AtomPort0],  [AtomPort0], 4, 4, [1], [1]>;
420 defm : AtomWriteResPair<WritePSADBWX,       [AtomPort0],  [AtomPort0], 5, 5, [2], [2]>;
421 defm : X86WriteResPairUnsupported<WritePSADBWY>;
422 defm : X86WriteResPairUnsupported<WritePSADBWZ>;
423 defm : AtomWriteResPair<WriteShuffle,       [AtomPort0],  [AtomPort0], 1, 1>;
424 defm : AtomWriteResPair<WriteShuffleX,      [AtomPort0],  [AtomPort0], 1, 1>;
425 defm : X86WriteResPairUnsupported<WriteShuffleY>;
426 defm : X86WriteResPairUnsupported<WriteShuffleZ>;
427 defm : AtomWriteResPair<WriteVarShuffle,    [AtomPort0],  [AtomPort0], 1, 1>;
428 defm : AtomWriteResPair<WriteVarShuffleX,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 4, 5, [3,3], [4,4], 4, 5>;
429 defm : X86WriteResPairUnsupported<WriteVarShuffleY>;
430 defm : X86WriteResPairUnsupported<WriteVarShuffleZ>;
431 defm : X86WriteResPairUnsupported<WriteBlend>;
432 defm : X86WriteResPairUnsupported<WriteBlendY>;
433 defm : X86WriteResPairUnsupported<WriteBlendZ>;
434 defm : X86WriteResPairUnsupported<WriteVarBlend>;
435 defm : X86WriteResPairUnsupported<WriteVarBlendY>;
436 defm : X86WriteResPairUnsupported<WriteVarBlendZ>;
437 defm : X86WriteResPairUnsupported<WriteShuffle256>;
438 defm : X86WriteResPairUnsupported<WriteVPMOV256>;
439 defm : X86WriteResPairUnsupported<WriteVarShuffle256>;
440 defm : X86WriteResPairUnsupported<WriteVarVecShift>;
441 defm : X86WriteResPairUnsupported<WriteVarVecShiftY>;
442 defm : X86WriteResPairUnsupported<WriteVarVecShiftZ>;
444 ////////////////////////////////////////////////////////////////////////////////
445 // Vector insert/extract operations.
446 ////////////////////////////////////////////////////////////////////////////////
448 defm : AtomWriteResPair<WriteVecInsert,     [AtomPort0],  [AtomPort0], 1, 1>;
449 def  : WriteRes<WriteVecExtract,   [AtomPort0]>;
450 def  : WriteRes<WriteVecExtractSt, [AtomPort0]>;
452 ////////////////////////////////////////////////////////////////////////////////
453 // SSE42 String instructions.
454 ////////////////////////////////////////////////////////////////////////////////
456 defm : X86WriteResPairUnsupported<WritePCmpIStrI>;
457 defm : X86WriteResPairUnsupported<WritePCmpIStrM>;
458 defm : X86WriteResPairUnsupported<WritePCmpEStrI>;
459 defm : X86WriteResPairUnsupported<WritePCmpEStrM>;
461 ////////////////////////////////////////////////////////////////////////////////
462 // MOVMSK Instructions.
463 ////////////////////////////////////////////////////////////////////////////////
465 def  : WriteRes<WriteFMOVMSK,    [AtomPort0]> { let Latency = 3; let ReleaseAtCycles = [3]; }
466 def  : WriteRes<WriteVecMOVMSK,  [AtomPort0]> { let Latency = 3; let ReleaseAtCycles = [3]; }
467 defm : X86WriteResUnsupported<WriteVecMOVMSKY>;
468 def  : WriteRes<WriteMMXMOVMSK,  [AtomPort0]> { let Latency = 3; let ReleaseAtCycles = [3]; }
470 ////////////////////////////////////////////////////////////////////////////////
471 // AES instructions.
472 ////////////////////////////////////////////////////////////////////////////////
474 defm : X86WriteResPairUnsupported<WriteAESIMC>;
475 defm : X86WriteResPairUnsupported<WriteAESKeyGen>;
476 defm : X86WriteResPairUnsupported<WriteAESDecEnc>;
478 ////////////////////////////////////////////////////////////////////////////////
479 // Horizontal add/sub  instructions.
480 ////////////////////////////////////////////////////////////////////////////////
482 defm : AtomWriteResPair<WriteFHAdd,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 8, 9, [8,8], [9,9], 5, 6>;
483 defm : X86WriteResPairUnsupported<WriteFHAddY>;
484 defm : AtomWriteResPair<WritePHAdd,  [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 3, 4, [3,3], [4,4], 3, 4>;
485 defm : AtomWriteResPair<WritePHAddX, [AtomPort0,AtomPort1], [AtomPort0,AtomPort1], 7, 8, [7,7], [8,8], 3, 4>;
486 defm : X86WriteResPairUnsupported<WritePHAddY>;
488 ////////////////////////////////////////////////////////////////////////////////
489 // Carry-less multiplication instructions.
490 ////////////////////////////////////////////////////////////////////////////////
492 defm : X86WriteResPairUnsupported<WriteCLMul>;
494 ////////////////////////////////////////////////////////////////////////////////
495 // Load/store MXCSR.
496 ////////////////////////////////////////////////////////////////////////////////
498 defm : X86WriteRes<WriteLDMXCSR, [AtomPort0,AtomPort1],  5,   [5,5], 4>;
499 defm : X86WriteRes<WriteSTMXCSR, [AtomPort0,AtomPort1], 15, [15,15], 4>;
501 ////////////////////////////////////////////////////////////////////////////////
502 // Special Cases.
503 ////////////////////////////////////////////////////////////////////////////////
505 // Port0
506 def AtomWrite0_1 : SchedWriteRes<[AtomPort0]> {
507   let Latency = 1;
508   let ReleaseAtCycles = [1];
510 def : InstRW<[AtomWrite0_1], (instrs XAM_F, LD_Frr,
511                                      MOVSX64rr32)>;
512 def : SchedAlias<WriteALURMW, AtomWrite0_1>;
513 def : SchedAlias<WriteADCRMW, AtomWrite0_1>;
514 def : InstRW<[AtomWrite0_1], (instregex "(RCL|RCR|ROL|ROR|SAR|SHL|SHR)(8|16|32|64)m",
515                                         "MOV(S|Z)X(32|64)rr(8|8_NOREX|16)")>;
517 // Port1
518 def AtomWrite1_1 : SchedWriteRes<[AtomPort1]> {
519   let Latency = 1;
520   let ReleaseAtCycles = [1];
522 def : InstRW<[AtomWrite1_1], (instrs FCOMPP)>;
523 def : InstRW<[AtomWrite1_1], (instregex "UCOM_F(P|PP)?r")>;
525 def AtomWrite1_5 : SchedWriteRes<[AtomPort1]> {
526   let Latency = 5;
527   let ReleaseAtCycles = [5];
529 def : InstRW<[AtomWrite1_5], (instrs MMX_CVTPI2PSrr, MMX_CVTPI2PSrm,
530                                      MMX_CVTPS2PIrr, MMX_CVTTPS2PIrr)>;
532 // Port0 and Port1
533 def AtomWrite0_1_1 : SchedWriteRes<[AtomPort0, AtomPort1]> {
534   let Latency = 1;
535   let ReleaseAtCycles = [1, 1];
537 def : InstRW<[AtomWrite0_1_1], (instrs POP32r, POP64r,
538                                        POP16rmr, POP32rmr, POP64rmr,
539                                        PUSH16r, PUSH32r, PUSH64r,
540                                        PUSH16i, PUSH32i,
541                                        PUSH16rmr, PUSH32rmr, PUSH64rmr,
542                                        PUSH16i8, PUSH32i8, PUSH64i8, PUSH64i32,
543                                        XCH_F)>;
544 def : InstRW<[AtomWrite0_1_1], (instregex "RETI(16|32|64)$",
545                                           "IRET(16|32|64)?")>;
547 def AtomWrite0_1_5 : SchedWriteRes<[AtomPort0, AtomPort1]> {
548   let Latency = 5;
549   let ReleaseAtCycles = [5, 5];
551 def : InstRW<[AtomWrite0_1_5], (instrs MMX_CVTPS2PIrm, MMX_CVTTPS2PIrm)>;
552 def : InstRW<[AtomWrite0_1_5], (instregex "ILD_F(16|32|64)")>;
554 def AtomWrite0_1_7 : SchedWriteRes<[AtomPort0,AtomPort1]> {
555   let Latency = 7;
556   let ReleaseAtCycles = [6,6];
558 def : InstRW<[AtomWrite0_1_7], (instregex "CVTSI642SDrm(_Int)?")>;
560 def AtomWrite0_1_7_4 : SchedWriteRes<[AtomPort0,AtomPort1]> {
561   let Latency = 7;
562   let ReleaseAtCycles = [8,8];
563   let NumMicroOps = 4;
565 def : InstRW<[AtomWrite0_1_7_4], (instregex "CVTSI642SSrr(_Int)?")>;
567 def AtomWrite0_1_8_4 : SchedWriteRes<[AtomPort0,AtomPort1]> {
568   let Latency = 8;
569   let ReleaseAtCycles = [8,8];
570   let NumMicroOps = 4;
572 def : InstRW<[AtomWrite0_1_7_4], (instregex "CVTSI642SSrm(_Int)?")>;
574 def AtomWrite0_1_9 : SchedWriteRes<[AtomPort0,AtomPort1]> {
575   let Latency = 9;
576   let ReleaseAtCycles = [9,9];
577   let NumMicroOps = 4;
579 def : InstRW<[AtomWrite0_1_9], (instregex "CVT(T)?SS2SI64rr(_Int)?")>;
581 def AtomWrite0_1_10 : SchedWriteRes<[AtomPort0,AtomPort1]> {
582   let Latency = 10;
583   let ReleaseAtCycles = [11,11];
584   let NumMicroOps = 5;
586 def : InstRW<[AtomWrite0_1_10], (instregex "CVT(T)?SS2SI64rm(_Int)?")>;
588 // Port0 or Port1
589 def AtomWrite01_1 : SchedWriteRes<[AtomPort01]> {
590   let Latency = 1;
591   let ReleaseAtCycles = [1];
593 def : InstRW<[AtomWrite01_1], (instrs FDECSTP, FFREE, FFREEP, FINCSTP, WAIT,
594                                       LFENCE,
595                                       STOSB, STOSL, STOSQ, STOSW,
596                                       MOVSSrr, MOVSSrr_REV)>;
598 def AtomWrite01_2 : SchedWriteRes<[AtomPort01]> {
599   let Latency = 2;
600   let ReleaseAtCycles = [2];
602 def : InstRW<[AtomWrite01_2], (instrs LEAVE, LEAVE64, POP16r,
603                                       PUSH16rmm, PUSH32rmm, PUSH64rmm,
604                                       LODSB, LODSL, LODSQ, LODSW,
605                                       SCASB, SCASL, SCASQ, SCASW)>;
606 def : InstRW<[AtomWrite01_2], (instregex "PUSH(CS|DS|ES|FS|GS|SS)(16|32|64)",
607                                          "(ST|ISTT)_F(P)?(16|32|64)?(m|rr)",
608                                          "MMX_P(ADD|SUB)Qrr",
609                                          "MOV(S|Z)X16rr8",
610                                          "MOV(UPS|UPD|DQU)mr",
611                                          "MASKMOVDQU(64)?",
612                                          "P(ADD|SUB)Qrr")>;
613 def : SchedAlias<WriteBitTestSetImmRMW, AtomWrite01_2>;
615 def AtomWrite01_3 : SchedWriteRes<[AtomPort01]> {
616   let Latency = 3;
617   let ReleaseAtCycles = [3];
619 def : InstRW<[AtomWrite01_3], (instrs CLD, LDDQUrm,
620                                       CMPSB, CMPSL, CMPSQ, CMPSW,
621                                       MOVSB, MOVSL, MOVSQ, MOVSW,
622                                       POP16rmm, POP32rmm, POP64rmm)>;
623 def : InstRW<[AtomWrite01_3], (instregex "XADD(8|16|32|64)rm",
624                                          "XCHG(8|16|32|64)rm",
625                                          "PH(ADD|SUB)Drr",
626                                          "MOV(S|Z)X16rm8",
627                                          "MMX_P(ADD|SUB)Qrm",
628                                          "MOV(UPS|UPD|DQU)rm",
629                                          "P(ADD|SUB)Qrm")>;
631 def AtomWrite01_4 : SchedWriteRes<[AtomPort01]> {
632   let Latency = 4;
633   let ReleaseAtCycles = [4];
635 def : InstRW<[AtomWrite01_4], (instrs CBW, CWD, CWDE, CDQ, CDQE, CQO,
636                                       JCXZ, JECXZ, JRCXZ,
637                                       LD_F80m)>;
638 def : InstRW<[AtomWrite01_4], (instregex "PH(ADD|SUB)Drm",
639                                          "(MMX_)?PEXTRWrr(_REV)?")>;
641 def AtomWrite01_5 : SchedWriteRes<[AtomPort01]> {
642   let Latency = 5;
643   let ReleaseAtCycles = [5];
645 def : InstRW<[AtomWrite01_5], (instrs FLDCW16m, ST_FP80m)>;
646 def : InstRW<[AtomWrite01_5], (instregex "MMX_PH(ADD|SUB)S?Wrr")>;
648 def AtomWrite01_6 : SchedWriteRes<[AtomPort01]> {
649   let Latency = 6;
650   let ReleaseAtCycles = [6];
652 def : InstRW<[AtomWrite01_6], (instrs CMPXCHG8rm, INTO, XLAT,
653                                       SHLD16rrCL, SHRD16rrCL,
654                                       SHLD16rri8, SHRD16rri8,
655                                       SHLD16mrCL, SHRD16mrCL,
656                                       SHLD16mri8, SHRD16mri8)>;
657 def : InstRW<[AtomWrite01_6], (instregex "IST_F(P)?(16|32|64)?m",
658                                          "MMX_PH(ADD|SUB)S?Wrm")>;
660 def AtomWrite01_7 : SchedWriteRes<[AtomPort01]> {
661   let Latency = 7;
662   let ReleaseAtCycles = [7];
664 def : InstRW<[AtomWrite01_7], (instrs AAD8i8)>;
666 def AtomWrite01_8 : SchedWriteRes<[AtomPort01]> {
667   let Latency = 8;
668   let ReleaseAtCycles = [8];
670 def : InstRW<[AtomWrite01_8], (instrs LOOPE,
671                                       PUSHA16, PUSHA32,
672                                       SHLD64rrCL, SHRD64rrCL,
673                                       FNSTCW16m)>;
675 def AtomWrite01_9 : SchedWriteRes<[AtomPort01]> {
676   let Latency = 9;
677   let ReleaseAtCycles = [9];
679 def : InstRW<[AtomWrite01_9], (instrs POPA16, POPA32,
680                                       PUSHF16, PUSHF32, PUSHF64,
681                                       SHLD64mrCL, SHRD64mrCL,
682                                       SHLD64mri8, SHRD64mri8,
683                                       SHLD64rri8, SHRD64rri8,
684                                       CMPXCHG8rr)>;
685 def : InstRW<[AtomWrite01_9], (instregex "(U)?COM_FI", "TST_F")>;
687 def AtomWrite01_10 : SchedWriteRes<[AtomPort01]> {
688   let Latency = 10;
689   let ReleaseAtCycles = [10];
691 def : SchedAlias<WriteFLDC, AtomWrite01_10>;
693 def AtomWrite01_11 : SchedWriteRes<[AtomPort01]> {
694   let Latency = 11;
695   let ReleaseAtCycles = [11];
697 def : InstRW<[AtomWrite01_11], (instrs BOUNDS16rm, BOUNDS32rm)>;
698 def : SchedAlias<WriteBitTestSetRegRMW, AtomWrite01_11>;
700 def AtomWrite01_13 : SchedWriteRes<[AtomPort01]> {
701   let Latency = 13;
702   let ReleaseAtCycles = [13];
704 def : InstRW<[AtomWrite01_13], (instrs AAA, AAS)>;
706 def AtomWrite01_14 : SchedWriteRes<[AtomPort01]> {
707   let Latency = 14;
708   let ReleaseAtCycles = [14];
710 def : InstRW<[AtomWrite01_14], (instrs CMPXCHG16rm, CMPXCHG32rm, CMPXCHG64rm)>;
712 def AtomWrite01_17 : SchedWriteRes<[AtomPort01]> {
713   let Latency = 17;
714   let ReleaseAtCycles = [17];
716 def : InstRW<[AtomWrite01_17], (instrs LOOPNE, PAUSE)>;
718 def AtomWrite01_18 : SchedWriteRes<[AtomPort01]> {
719   let Latency = 18;
720   let ReleaseAtCycles = [18];
722 def : InstRW<[AtomWrite01_18], (instrs CMPXCHG8B, DAA, LOOP)>;
724 def AtomWrite01_20 : SchedWriteRes<[AtomPort01]> {
725   let Latency = 20;
726   let ReleaseAtCycles = [20];
728 def : InstRW<[AtomWrite01_20], (instrs DAS)>;
730 def AtomWrite01_21 : SchedWriteRes<[AtomPort01]> {
731   let Latency = 21;
732   let ReleaseAtCycles = [21];
734 def : InstRW<[AtomWrite01_21], (instrs AAM8i8, STD)>;
736 def AtomWrite01_22 : SchedWriteRes<[AtomPort01]> {
737   let Latency = 22;
738   let ReleaseAtCycles = [22];
740 def : InstRW<[AtomWrite01_22], (instrs CMPXCHG16B)>;
742 def AtomWrite01_23 : SchedWriteRes<[AtomPort01]> {
743   let Latency = 23;
744   let ReleaseAtCycles = [23];
746 def : InstRW<[AtomWrite01_23], (instrs ARPL16mr, ARPL16rr)>;
748 def AtomWrite01_25 : SchedWriteRes<[AtomPort01]> {
749   let Latency = 25;
750   let ReleaseAtCycles = [25];
752 def : InstRW<[AtomWrite01_25], (instrs FNCLEX, FXTRACT)>;
754 def AtomWrite01_26 : SchedWriteRes<[AtomPort01]> {
755   let Latency = 26;
756   let ReleaseAtCycles = [26];
758 def : InstRW<[AtomWrite01_26], (instrs POPF32, POPF64)>;
760 def AtomWrite01_29 : SchedWriteRes<[AtomPort01]> {
761   let Latency = 29;
762   let ReleaseAtCycles = [29];
764 def : InstRW<[AtomWrite01_29], (instregex "POP(DS|ES|FS|GS)(16|32|64)")>;
766 def AtomWrite01_30 : SchedWriteRes<[AtomPort01]> {
767   let Latency = 30;
768   let ReleaseAtCycles = [30];
770 def : InstRW<[AtomWrite01_30], (instrs RDTSC, RDTSCP)>;
772 def AtomWrite01_32 : SchedWriteRes<[AtomPort01]> {
773   let Latency = 32;
774   let ReleaseAtCycles = [32];
776 def : InstRW<[AtomWrite01_32], (instrs ENTER, POPF16)>;
778 def AtomWrite01_45 : SchedWriteRes<[AtomPort01]> {
779   let Latency = 45;
780   let ReleaseAtCycles = [45];
782 def : InstRW<[AtomWrite01_45], (instrs MONITOR32rrr, MONITOR64rrr)>;
784 def AtomWrite01_46 : SchedWriteRes<[AtomPort01]> {
785   let Latency = 46;
786   let ReleaseAtCycles = [46];
788 def : InstRW<[AtomWrite01_46], (instrs FRNDINT, MWAITrr, RDPMC)>;
790 def AtomWrite01_48 : SchedWriteRes<[AtomPort01]> {
791   let Latency = 48;
792   let ReleaseAtCycles = [48];
794 def : InstRW<[AtomWrite01_48], (instrs POPSS16, POPSS32)>;
796 def AtomWrite01_55 : SchedWriteRes<[AtomPort01]> {
797   let Latency = 55;
798   let ReleaseAtCycles = [55];
800 def : InstRW<[AtomWrite01_55], (instrs FPREM)>;
802 def AtomWrite01_59 : SchedWriteRes<[AtomPort01]> {
803   let Latency = 59;
804   let ReleaseAtCycles = [59];
806 def : InstRW<[AtomWrite01_59], (instrs INSB, INSL, INSW)>;
808 def AtomWrite01_63 : SchedWriteRes<[AtomPort01]> {
809   let Latency = 63;
810   let ReleaseAtCycles = [63];
812 def : InstRW<[AtomWrite01_63], (instrs FNINIT)>;
814 def AtomWrite01_68 : SchedWriteRes<[AtomPort01]> {
815   let Latency = 68;
816   let ReleaseAtCycles = [68];
818 def : InstRW<[AtomWrite01_68], (instrs OUT8rr, OUT16rr, OUT32rr)>;
820 def AtomWrite01_71 : SchedWriteRes<[AtomPort01]> {
821   let Latency = 71;
822   let ReleaseAtCycles = [71];
824 def : InstRW<[AtomWrite01_71], (instrs FPREM1,
825                                        INVLPG, INVLPGA32, INVLPGA64)>;
827 def AtomWrite01_72 : SchedWriteRes<[AtomPort01]> {
828   let Latency = 72;
829   let ReleaseAtCycles = [72];
831 def : InstRW<[AtomWrite01_72], (instrs OUT8ir, OUT16ir, OUT32ir)>;
833 def AtomWrite01_74 : SchedWriteRes<[AtomPort01]> {
834   let Latency = 74;
835   let ReleaseAtCycles = [74];
837 def : InstRW<[AtomWrite01_74], (instrs OUTSB, OUTSL, OUTSW)>;
839 def AtomWrite01_77 : SchedWriteRes<[AtomPort01]> {
840   let Latency = 77;
841   let ReleaseAtCycles = [77];
843 def : InstRW<[AtomWrite01_77], (instrs FSCALE)>;
845 def AtomWrite01_78 : SchedWriteRes<[AtomPort01]> {
846   let Latency = 78;
847   let ReleaseAtCycles = [78];
849 def : InstRW<[AtomWrite01_78], (instrs RDMSR)>;
851 def AtomWrite01_79 : SchedWriteRes<[AtomPort01]> {
852   let Latency = 79;
853   let ReleaseAtCycles = [79];
855 def : InstRW<[AtomWrite01_79], (instregex "RET(16|32|64)?$",
856                                           "LRETI?(16|32|64)")>;
858 def AtomWrite01_92 : SchedWriteRes<[AtomPort01]> {
859   let Latency = 92;
860   let ReleaseAtCycles = [92];
862 def : InstRW<[AtomWrite01_92], (instrs IN8ri, IN16ri, IN32ri)>;
864 def AtomWrite01_94 : SchedWriteRes<[AtomPort01]> {
865   let Latency = 94;
866   let ReleaseAtCycles = [94];
868 def : InstRW<[AtomWrite01_94], (instrs IN8rr, IN16rr, IN32rr)>;
870 def AtomWrite01_99 : SchedWriteRes<[AtomPort01]> {
871   let Latency = 99;
872   let ReleaseAtCycles = [99];
874 def : InstRW<[AtomWrite01_99], (instrs F2XM1)>;
876 def AtomWrite01_121 : SchedWriteRes<[AtomPort01]> {
877   let Latency = 121;
878   let ReleaseAtCycles = [121];
880 def : InstRW<[AtomWrite01_121], (instrs CPUID)>;
882 def AtomWrite01_127 : SchedWriteRes<[AtomPort01]> {
883   let Latency = 127;
884   let ReleaseAtCycles = [127];
886 def : InstRW<[AtomWrite01_127], (instrs INT)>;
888 def AtomWrite01_130 : SchedWriteRes<[AtomPort01]> {
889   let Latency = 130;
890   let ReleaseAtCycles = [130];
892 def : InstRW<[AtomWrite01_130], (instrs INT3)>;
894 def AtomWrite01_140 : SchedWriteRes<[AtomPort01]> {
895   let Latency = 140;
896   let ReleaseAtCycles = [140];
898 def : InstRW<[AtomWrite01_140], (instrs FXSAVE, FXSAVE64)>;
900 def AtomWrite01_141 : SchedWriteRes<[AtomPort01]> {
901   let Latency = 141;
902   let ReleaseAtCycles = [141];
904 def : InstRW<[AtomWrite01_141], (instrs FXRSTOR, FXRSTOR64)>;
906 def AtomWrite01_146 : SchedWriteRes<[AtomPort01]> {
907   let Latency = 146;
908   let ReleaseAtCycles = [146];
910 def : InstRW<[AtomWrite01_146], (instrs FYL2X)>;
912 def AtomWrite01_147 : SchedWriteRes<[AtomPort01]> {
913   let Latency = 147;
914   let ReleaseAtCycles = [147];
916 def : InstRW<[AtomWrite01_147], (instrs FYL2XP1)>;
918 def AtomWrite01_168 : SchedWriteRes<[AtomPort01]> {
919   let Latency = 168;
920   let ReleaseAtCycles = [168];
922 def : InstRW<[AtomWrite01_168], (instrs FPTAN)>;
924 def AtomWrite01_174 : SchedWriteRes<[AtomPort01]> {
925   let Latency = 174;
926   let ReleaseAtCycles = [174];
928 def : InstRW<[AtomWrite01_174], (instrs FSINCOS, FSIN, FCOS)>;
930 def AtomWrite01_183 : SchedWriteRes<[AtomPort01]> {
931   let Latency = 183;
932   let ReleaseAtCycles = [183];
934 def : InstRW<[AtomWrite01_183], (instrs FPATAN)>;
936 def AtomWrite01_202 : SchedWriteRes<[AtomPort01]> {
937   let Latency = 202;
938   let ReleaseAtCycles = [202];
940 def : InstRW<[AtomWrite01_202], (instrs WRMSR)>;
942 } // SchedModel