1 //=- X86SchedSapphireRapids.td - X86 SapphireRapids Scheduling *- tablegen -*=//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file defines the machine model for SapphireRapids to support instruction
10 // scheduling and other instruction cost heuristics.
12 //===----------------------------------------------------------------------===//
14 def SapphireRapidsModel : SchedMachineModel {
15 // SapphireRapids can allocate 6 uops per cycle.
16 let IssueWidth = 6; // Based on allocator width.
17 let MicroOpBufferSize = 512; // Based on the reorder buffer.
19 let MispredictPenalty = 14;
21 // Latency for microcoded instructions or instructions without latency info.
24 // Based on the LSD (loop-stream detector) queue size (ST).
25 let LoopMicroOpBufferSize = 72;
27 // This flag is set to allow the scheduler to assign a default model to
28 // unrecognized opcodes.
29 let CompleteModel = 0;
32 let SchedModel = SapphireRapidsModel in {
34 // SapphireRapids can issue micro-ops to 12 different ports in one cycle.
35 def SPRPort00 : ProcResource<1>;
36 def SPRPort01 : ProcResource<1>;
37 def SPRPort02 : ProcResource<1>;
38 def SPRPort03 : ProcResource<1>;
39 def SPRPort04 : ProcResource<1>;
40 def SPRPort05 : ProcResource<1>;
41 def SPRPort06 : ProcResource<1>;
42 def SPRPort07 : ProcResource<1>;
43 def SPRPort08 : ProcResource<1>;
44 def SPRPort09 : ProcResource<1>;
45 def SPRPort10 : ProcResource<1>;
46 def SPRPort11 : ProcResource<1>;
48 // Workaround to represent invalid ports. WriteRes shouldn't use this resource.
49 def SPRPortInvalid :ProcResource<1>;
51 // Many micro-ops are capable of issuing on multiple ports.
52 def SPRPort00_01 : ProcResGroup<[SPRPort00, SPRPort01]>;
53 def SPRPort00_01_05 : ProcResGroup<[SPRPort00, SPRPort01, SPRPort05]>;
54 def SPRPort00_01_05_06 : ProcResGroup<[SPRPort00, SPRPort01, SPRPort05, SPRPort06]>;
55 def SPRPort00_05 : ProcResGroup<[SPRPort00, SPRPort05]>;
56 def SPRPort00_05_06 : ProcResGroup<[SPRPort00, SPRPort05, SPRPort06]>;
57 def SPRPort00_06 : ProcResGroup<[SPRPort00, SPRPort06]>;
58 def SPRPort01_05 : ProcResGroup<[SPRPort01, SPRPort05]>;
59 def SPRPort01_05_10 : ProcResGroup<[SPRPort01, SPRPort05, SPRPort10]>;
60 def SPRPort02_03 : ProcResGroup<[SPRPort02, SPRPort03]>;
61 def SPRPort02_03_11 : ProcResGroup<[SPRPort02, SPRPort03, SPRPort11]>;
62 def SPRPort07_08 : ProcResGroup<[SPRPort07, SPRPort08]>;
64 // EU has 112 reservation stations.
65 def SPRPort00_01_05_06_10 : ProcResGroup<[SPRPort00, SPRPort01, SPRPort05,
66 SPRPort06, SPRPort10]> {
70 // STD has 48 reservation stations.
71 def SPRPort04_09 : ProcResGroup<[SPRPort04, SPRPort09]> {
75 // MEM has 72 reservation stations.
76 def SPRPort02_03_07_08_11 : ProcResGroup<[SPRPort02, SPRPort03, SPRPort07,
77 SPRPort08, SPRPort11]> {
81 // Integer loads are 5 cycles, so ReadAfterLd registers needn't be available
82 // until 5 cycles after the memory operand.
83 def : ReadAdvance<ReadAfterLd, 5>;
85 // Vector loads are 6 cycles, so ReadAfterVec*Ld registers needn't be available
86 // until 6 cycles after the memory operand.
87 def : ReadAdvance<ReadAfterVecLd, 6>;
88 def : ReadAdvance<ReadAfterVecXLd, 6>;
89 def : ReadAdvance<ReadAfterVecYLd, 6>;
91 def : ReadAdvance<ReadInt2Fpu, 0>;
93 // Many SchedWrites are defined in pairs with and without a folded load.
94 // Instructions with folded loads are usually micro-fused, so they only appear
95 // as two micro-ops when queued in the reservation station.
96 // This multiclass defines the resource usage for variants with and without
98 multiclass SPRWriteResPair<X86FoldableSchedWrite SchedRW,
99 list<ProcResourceKind> ExePorts,
100 int Lat, list<int> Res = [1], int UOps = 1,
101 int LoadLat = 5, int LoadUOps = 1> {
102 // Register variant is using a single cycle on ExePort.
103 def : WriteRes<SchedRW, ExePorts> {
105 let ReleaseAtCycles = Res;
106 let NumMicroOps = UOps;
109 // Memory variant also uses a cycle on port 2/3/11 and adds LoadLat cycles to
110 // the latency (default = 5).
111 def : WriteRes<SchedRW.Folded, !listconcat([SPRPort02_03_11], ExePorts)> {
112 let Latency = !add(Lat, LoadLat);
113 let ReleaseAtCycles = !listconcat([1], Res);
114 let NumMicroOps = !add(UOps, LoadUOps);
118 //===----------------------------------------------------------------------===//
119 // The following definitons are infered by smg.
120 //===----------------------------------------------------------------------===//
122 // Infered SchedWrite definition.
123 def : WriteRes<WriteADC, [SPRPort00_06]>;
124 defm : X86WriteRes<WriteADCLd, [SPRPort00_01_05_06_10, SPRPort00_06], 11, [1, 1], 2>;
125 defm : SPRWriteResPair<WriteAESDecEnc, [SPRPort00_01], 5, [1], 1, 7>;
126 defm : SPRWriteResPair<WriteAESIMC, [SPRPort00_01], 8, [2], 2, 7>;
127 defm : X86WriteRes<WriteAESKeyGen, [SPRPort00, SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort01_05, SPRPort05], 7, [4, 1, 1, 2, 3, 3], 14>;
128 defm : X86WriteRes<WriteAESKeyGenLd, [SPRPort00, SPRPort00_01, SPRPort00_06, SPRPort01_05, SPRPort02_03_11, SPRPort05], 12, [4, 1, 2, 3, 1, 3], 14>;
129 def : WriteRes<WriteALU, [SPRPort00_01_05_06_10]>;
130 def : WriteRes<WriteALULd, [SPRPort00_01_05_06_10]> {
133 defm : SPRWriteResPair<WriteBEXTR, [SPRPort00_06, SPRPort01], 6, [1, 1], 2>;
134 defm : SPRWriteResPair<WriteBLS, [SPRPort01_05_10], 2, [1]>;
135 defm : SPRWriteResPair<WriteBSF, [SPRPort01], 3, [1]>;
136 defm : SPRWriteResPair<WriteBSR, [SPRPort01], 3, [1]>;
137 def : WriteRes<WriteBSWAP32, [SPRPort01]>;
138 defm : X86WriteRes<WriteBSWAP64, [SPRPort00_06, SPRPort01], 2, [1, 1], 2>;
139 defm : SPRWriteResPair<WriteBZHI, [SPRPort01], 3, [1]>;
140 def : WriteRes<WriteBitTest, [SPRPort01]>;
141 defm : X86WriteRes<WriteBitTestImmLd, [SPRPort01, SPRPort02_03_11], 6, [1, 1], 2>;
142 defm : X86WriteRes<WriteBitTestRegLd, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11], 11, [4, 2, 1, 2, 1], 10>;
143 def : WriteRes<WriteBitTestSet, [SPRPort01]>;
144 def : WriteRes<WriteBitTestSetImmLd, [SPRPort01]> {
147 defm : X86WriteRes<WriteBitTestSetRegLd, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10], 17, [3, 2, 1, 2], 8>;
148 defm : SPRWriteResPair<WriteBlend, [SPRPort01_05], 1, [1], 1, 7>;
149 defm : SPRWriteResPair<WriteBlendY, [SPRPort00_01_05], 1, [1], 1, 8>;
150 defm : SPRWriteResPair<WriteCLMul, [SPRPort05], 3, [1], 1, 7>;
151 defm : SPRWriteResPair<WriteCMOV, [SPRPort00_06], 1, [1], 1, 6>;
152 defm : X86WriteRes<WriteCMPXCHG, [SPRPort00_01_05_06_10, SPRPort00_06], 3, [3, 2], 5>;
153 defm : X86WriteRes<WriteCMPXCHGRMW, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08], 12, [1, 2, 1, 1, 1], 6>;
154 defm : SPRWriteResPair<WriteCRC32, [SPRPort01], 3, [1]>;
155 defm : X86WriteRes<WriteCvtI2PD, [SPRPort00_01, SPRPort05], 5, [1, 1], 2>;
156 defm : X86WriteRes<WriteCvtI2PDLd, [SPRPort00_01, SPRPort02_03_11], 11, [1, 1], 2>;
157 defm : X86WriteRes<WriteCvtI2PDY, [SPRPort00_01, SPRPort05], 7, [1, 1], 2>;
158 defm : X86WriteRes<WriteCvtI2PDYLd, [SPRPort00_01, SPRPort02_03_11], 12, [1, 1], 2>;
159 defm : SPRWriteResPair<WriteCvtI2PDZ, [SPRPort00], 4, [1], 1, 8>;
160 defm : SPRWriteResPair<WriteCvtI2PS, [SPRPort00_01], 4, [1], 1, 7>;
161 defm : SPRWriteResPair<WriteCvtI2PSY, [SPRPort00_01], 4, [1], 1, 8>;
162 defm : SPRWriteResPair<WriteCvtI2PSZ, [SPRPort00], 4, [1], 1, 8>;
163 defm : X86WriteRes<WriteCvtI2SD, [SPRPort00_01, SPRPort05], 7, [1, 1], 2>;
164 defm : X86WriteRes<WriteCvtI2SDLd, [SPRPort00_01, SPRPort02_03_11], 11, [1, 1], 2>;
165 defm : X86WriteRes<WriteCvtI2SS, [SPRPort00_01, SPRPort00_01_05, SPRPort05], 9, [1, 1, 1], 3>;
166 defm : X86WriteRes<WriteCvtI2SSLd, [SPRPort00_01, SPRPort02_03_11], 11, [1, 1], 2>;
167 defm : X86WriteRes<WriteCvtPD2I, [SPRPort00_01, SPRPort05], 5, [1, 1], 2>;
168 defm : X86WriteRes<WriteCvtPD2ILd, [SPRPort00_01, SPRPort02_03_11], 12, [1, 1], 2>;
169 defm : X86WriteRes<WriteCvtPD2IY, [SPRPort00_01, SPRPort05], 7, [1, 1], 2>;
170 defm : X86WriteRes<WriteCvtPD2IYLd, [SPRPort00_01, SPRPort02_03_11], 12, [1, 1], 2>;
171 defm : X86WriteRes<WriteCvtPD2IZ, [SPRPort00, SPRPort05], 7, [1, 1], 2>;
172 defm : X86WriteRes<WriteCvtPD2IZLd, [SPRPort00, SPRPort02_03_11], 12, [1, 1], 2>;
173 defm : SPRWriteResPair<WriteCvtPD2PS, [SPRPort00_01, SPRPort05], 5, [1, 1], 2, 7>;
174 defm : SPRWriteResPair<WriteCvtPD2PSY, [SPRPort00_01, SPRPort05], 7, [1, 1], 2, 8>;
175 defm : SPRWriteResPair<WriteCvtPD2PSZ, [SPRPort00, SPRPort05], 7, [1, 1], 2, 8>;
176 defm : X86WriteRes<WriteCvtPH2PS, [SPRPort00_01, SPRPort05], 6, [1, 1], 2>;
177 defm : X86WriteRes<WriteCvtPH2PSLd, [SPRPort00_01, SPRPort02_03_11], 12, [1, 1], 2>;
178 defm : X86WriteRes<WriteCvtPH2PSY, [SPRPort00_01, SPRPort05], 8, [1, 1], 2>;
179 defm : X86WriteRes<WriteCvtPH2PSYLd, [SPRPort00_01, SPRPort02_03_11], 12, [1, 1], 2>;
180 defm : SPRWriteResPair<WriteCvtPH2PSZ, [SPRPort00, SPRPort05], 11, [1, 1], 2>;
181 defm : SPRWriteResPair<WriteCvtPS2I, [SPRPort00_01], 4, [1], 1, 7>;
182 defm : SPRWriteResPair<WriteCvtPS2IY, [SPRPort00_01], 4, [1], 1, 8>;
183 defm : X86WriteRes<WriteCvtPS2IZ, [SPRPort00, SPRPort00_05, SPRPort05], 10, [1, 2, 1], 4>;
184 defm : X86WriteRes<WriteCvtPS2IZLd, [SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort02_03_11, SPRPort05], 18, [1, 2, 1, 1, 1], 6>;
185 defm : X86WriteRes<WriteCvtPS2PD, [SPRPort00_01, SPRPort05], 5, [1, 1], 2>;
186 defm : X86WriteRes<WriteCvtPS2PDLd, [SPRPort00_01, SPRPort02_03_11], 11, [1, 1], 2>;
187 defm : X86WriteRes<WriteCvtPS2PDY, [SPRPort00_01, SPRPort05], 7, [1, 1], 2>;
188 defm : X86WriteRes<WriteCvtPS2PDYLd, [SPRPort00_01, SPRPort02_03_11], 12, [1, 1], 2>;
189 defm : SPRWriteResPair<WriteCvtPS2PDZ, [SPRPort00, SPRPort05], 7, [1, 1], 2, 6>;
190 defm : X86WriteRes<WriteCvtPS2PH, [SPRPort00_01, SPRPort05], 6, [1, 1], 2>;
191 defm : X86WriteRes<WriteCvtPS2PHSt, [SPRPort00_01, SPRPort04_09, SPRPort07_08], 12, [1, 1, 1], 3>;
192 defm : X86WriteRes<WriteCvtPS2PHY, [SPRPort00_01, SPRPort05], 8, [1, 1], 2>;
193 defm : X86WriteRes<WriteCvtPS2PHYSt, [SPRPort00_01, SPRPort04_09, SPRPort07_08], 12, [1, 1, 1], 3>;
194 defm : X86WriteRes<WriteCvtPS2PHZ, [SPRPort00, SPRPort05], 11, [1, 1], 2>;
195 defm : X86WriteRes<WriteCvtPS2PHZSt, [SPRPort00, SPRPort04_09, SPRPort07_08], 12, [1, 1, 1], 3>;
196 defm : SPRWriteResPair<WriteCvtSD2I, [SPRPort00, SPRPort00_01], 7, [1, 1], 2>;
197 defm : SPRWriteResPair<WriteCvtSD2SS, [SPRPort00_01, SPRPort05], 5, [1, 1], 2, 7>;
198 defm : SPRWriteResPair<WriteCvtSS2I, [SPRPort00, SPRPort00_01], 7, [1, 1], 2>;
199 defm : X86WriteRes<WriteCvtSS2SD, [SPRPort00_01, SPRPort05], 5, [1, 1], 2>;
200 defm : X86WriteRes<WriteCvtSS2SDLd, [SPRPort00_01, SPRPort02_03_11], 11, [1, 1], 2>;
201 defm : SPRWriteResPair<WriteDPPD, [SPRPort00_01, SPRPort01_05], 9, [2, 1], 3, 7>;
202 defm : SPRWriteResPair<WriteDPPS, [SPRPort00_01, SPRPort00_06, SPRPort01_05, SPRPort05], 14, [2, 1, 2, 1], 6, 7>;
203 defm : SPRWriteResPair<WriteDPPSY, [SPRPort00_01, SPRPort00_06, SPRPort01_05, SPRPort05], 14, [2, 1, 2, 1], 6, 8>;
204 defm : SPRWriteResPair<WriteDiv16, [SPRPort00_01_05_06_10, SPRPort01], 16, [1, 3], 4, 4>;
205 defm : SPRWriteResPair<WriteDiv32, [SPRPort00_01_05_06_10, SPRPort01], 15, [1, 3], 4, 4>;
206 defm : SPRWriteResPair<WriteDiv64, [SPRPort01], 18, [3], 3>;
207 defm : X86WriteRes<WriteDiv8, [SPRPort01], 17, [3], 3>;
208 defm : X86WriteRes<WriteDiv8Ld, [SPRPort01], 22, [3], 3>;
209 defm : X86WriteRes<WriteEMMS, [SPRPort00, SPRPort00_05, SPRPort00_06], 10, [1, 8, 1], 10>;
210 defm : SPRWriteResPair<WriteFAdd, [SPRPort01_05], 3, [1], 1, 7>;
211 defm : SPRWriteResPair<WriteFAdd64, [SPRPort01_05], 3, [1], 1, 7>;
212 defm : SPRWriteResPair<WriteFAdd64X, [SPRPort01_05], 3, [1], 1, 7>;
213 defm : SPRWriteResPair<WriteFAdd64Y, [SPRPort01_05], 3, [1], 1, 8>;
214 defm : SPRWriteResPair<WriteFAdd64Z, [SPRPort00_05], 4, [1], 1, 7>;
215 defm : SPRWriteResPair<WriteFAddX, [SPRPort00_01], 4, [1], 1, 7>;
216 defm : SPRWriteResPair<WriteFAddY, [SPRPort00_01], 4, [1], 1, 8>;
217 defm : SPRWriteResPair<WriteFAddZ, [SPRPort00], 4, [1], 1, 8>;
218 defm : SPRWriteResPair<WriteFBlend, [SPRPort00_01_05], 1, [1], 1, 7>;
219 defm : SPRWriteResPair<WriteFBlendY, [SPRPort00_01_05], 1, [1], 1, 8>;
220 def : WriteRes<WriteFCMOV, [SPRPort01]> {
223 defm : SPRWriteResPair<WriteFCmp, [SPRPort00_01], 4, [1], 1, 7>;
224 defm : SPRWriteResPair<WriteFCmp64, [SPRPort00_01], 4, [1], 1, 7>;
225 defm : SPRWriteResPair<WriteFCmp64X, [SPRPort00_01], 4, [1], 1, 7>;
226 defm : SPRWriteResPair<WriteFCmp64Y, [SPRPort00_01], 4, [1], 1, 8>;
227 defm : SPRWriteResPair<WriteFCmp64Z, [SPRPort00], 4, [1], 1, 8>;
228 defm : SPRWriteResPair<WriteFCmpX, [SPRPort00_01], 4, [1], 1, 7>;
229 defm : SPRWriteResPair<WriteFCmpY, [SPRPort00_01], 4, [1], 1, 8>;
230 def : WriteRes<WriteFCmpZ, [SPRPort05]> {
233 defm : X86WriteRes<WriteFCmpZLd, [SPRPort00, SPRPort02_03_11], 12, [1, 1], 2>;
234 defm : SPRWriteResPair<WriteFCom, [SPRPort05], 1, [1], 1, 7>;
235 defm : SPRWriteResPair<WriteFComX, [SPRPort00], 3, [1]>;
236 defm : SPRWriteResPair<WriteFDiv, [SPRPort00], 11, [1], 1, 7>;
237 defm : SPRWriteResPair<WriteFDiv64, [SPRPort00], 14, [1], 1, 6>;
238 defm : SPRWriteResPair<WriteFDiv64X, [SPRPort00], 14, [1], 1, 6>;
239 defm : SPRWriteResPair<WriteFDiv64Y, [SPRPort00], 14, [1], 1, 7>;
240 defm : SPRWriteResPair<WriteFDiv64Z, [SPRPort00, SPRPort00_05], 23, [2, 1], 3, 7>;
241 defm : SPRWriteResPair<WriteFDivX, [SPRPort00], 11, [1], 1, 7>;
242 defm : SPRWriteResPair<WriteFDivY, [SPRPort00], 11, [1], 1, 8>;
243 defm : SPRWriteResPair<WriteFDivZ, [SPRPort00, SPRPort00_05], 18, [2, 1], 3, 7>;
244 defm : SPRWriteResPair<WriteFHAdd, [SPRPort01_05, SPRPort05], 6, [1, 2], 3, 6>;
245 defm : SPRWriteResPair<WriteFHAddY, [SPRPort01_05, SPRPort05], 5, [1, 2], 3, 8>;
246 def : WriteRes<WriteFLD0, [SPRPort00_05]>;
247 defm : X86WriteRes<WriteFLD1, [SPRPort00_05], 1, [2], 2>;
248 defm : X86WriteRes<WriteFLDC, [SPRPort00_05], 1, [2], 2>;
249 def : WriteRes<WriteFLoad, [SPRPort02_03_11]> {
252 def : WriteRes<WriteFLoadX, [SPRPort02_03_11]> {
255 def : WriteRes<WriteFLoadY, [SPRPort02_03_11]> {
258 defm : SPRWriteResPair<WriteFLogic, [SPRPort00_01_05], 1, [1], 1, 7>;
259 defm : SPRWriteResPair<WriteFLogicY, [SPRPort00_01_05], 1, [1], 1, 8>;
260 defm : SPRWriteResPair<WriteFLogicZ, [SPRPort00_05], 1, [1], 1, 8>;
261 defm : SPRWriteResPair<WriteFMA, [SPRPort00_01], 4, [1], 1, 7>;
262 defm : SPRWriteResPair<WriteFMAX, [SPRPort00_01], 4, [1], 1, 7>;
263 defm : SPRWriteResPair<WriteFMAY, [SPRPort00_01], 4, [1], 1, 8>;
264 defm : SPRWriteResPair<WriteFMAZ, [SPRPort00], 4, [1], 1, 8>;
265 def : WriteRes<WriteFMOVMSK, [SPRPort00]> {
268 defm : X86WriteRes<WriteFMaskedLoad, [SPRPort00_01_05, SPRPort02_03_11], 8, [1, 1], 2>;
269 defm : X86WriteRes<WriteFMaskedLoadY, [SPRPort00_01_05, SPRPort02_03_11], 9, [1, 1], 2>;
270 defm : X86WriteRes<WriteFMaskedStore32, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
271 defm : X86WriteRes<WriteFMaskedStore32Y, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
272 defm : X86WriteRes<WriteFMaskedStore64, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
273 defm : X86WriteRes<WriteFMaskedStore64Y, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
274 defm : X86WriteRes<WriteFMoveX, [], 1, [], 0>;
275 defm : X86WriteRes<WriteFMoveY, [], 1, [], 0>;
276 def : WriteRes<WriteFMoveZ, [SPRPort00_05]>;
277 defm : SPRWriteResPair<WriteFMul, [SPRPort00_01], 4, [1], 1, 7>;
278 defm : SPRWriteResPair<WriteFMul64, [SPRPort00_01], 4, [1], 1, 7>;
279 defm : SPRWriteResPair<WriteFMul64X, [SPRPort00_01], 4, [1], 1, 7>;
280 defm : SPRWriteResPair<WriteFMul64Y, [SPRPort00_01], 4, [1], 1, 8>;
281 defm : SPRWriteResPair<WriteFMul64Z, [SPRPort00], 4, [1], 1, 8>;
282 defm : SPRWriteResPair<WriteFMulX, [SPRPort00_01], 4, [1], 1, 7>;
283 defm : SPRWriteResPair<WriteFMulY, [SPRPort00_01], 4, [1], 1, 8>;
284 defm : SPRWriteResPair<WriteFMulZ, [SPRPort00], 4, [1], 1, 8>;
285 defm : SPRWriteResPair<WriteFRcp, [SPRPort00], 4, [1], 1, 7>;
286 defm : SPRWriteResPair<WriteFRcpX, [SPRPort00], 4, [1], 1, 7>;
287 defm : SPRWriteResPair<WriteFRcpY, [SPRPort00], 4, [1], 1, 8>;
288 defm : SPRWriteResPair<WriteFRcpZ, [SPRPort00, SPRPort00_05], 7, [2, 1], 3, 7>;
289 defm : SPRWriteResPair<WriteFRnd, [SPRPort00_01], 4, [1], 1, 7>;
290 defm : SPRWriteResPair<WriteFRndY, [SPRPort00_01], 4, [1], 1, 8>;
291 defm : SPRWriteResPair<WriteFRndZ, [SPRPort00], 4, [1], 1, 8>;
292 defm : SPRWriteResPair<WriteFRsqrt, [SPRPort00], 4, [1], 1, 7>;
293 defm : SPRWriteResPair<WriteFRsqrtX, [SPRPort00], 4, [1], 1, 7>;
294 defm : SPRWriteResPair<WriteFRsqrtY, [SPRPort00], 4, [1], 1, 8>;
295 defm : SPRWriteResPair<WriteFRsqrtZ, [SPRPort00, SPRPort00_05], 9, [2, 1], 3>;
296 defm : SPRWriteResPair<WriteFShuffle, [SPRPort05], 1, [1], 1, 7>;
297 defm : SPRWriteResPair<WriteFShuffle256, [SPRPort05], 3, [1], 1, 8>;
298 defm : SPRWriteResPair<WriteFShuffleY, [SPRPort05], 1, [1], 1, 8>;
299 defm : SPRWriteResPair<WriteFShuffleZ, [SPRPort05], 1, [1], 1, 8>;
300 def : WriteRes<WriteFSign, [SPRPort00]>;
301 defm : SPRWriteResPair<WriteFSqrt, [SPRPort00], 12, [1], 1, 7>;
302 defm : SPRWriteResPair<WriteFSqrt64, [SPRPort00], 18, [1]>;
303 defm : SPRWriteResPair<WriteFSqrt64X, [SPRPort00], 18, [1], 1, 6>;
304 defm : SPRWriteResPair<WriteFSqrt64Y, [SPRPort00], 18, [1], 1, 3>;
305 // Warning: negtive load latency.
306 defm : SPRWriteResPair<WriteFSqrt64Z, [SPRPort00, SPRPort00_05], 32, [2, 1], 3, -1>;
307 def : WriteRes<WriteFSqrt80, [SPRPortInvalid, SPRPort00]> {
308 let ReleaseAtCycles = [7, 1];
311 defm : SPRWriteResPair<WriteFSqrtX, [SPRPort00], 12, [1], 1, 7>;
312 defm : SPRWriteResPair<WriteFSqrtY, [SPRPort00], 12, [1], 1, 8>;
313 defm : SPRWriteResPair<WriteFSqrtZ, [SPRPort00, SPRPort00_05], 20, [2, 1], 3, 7>;
314 defm : X86WriteRes<WriteFStore, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
315 defm : X86WriteResUnsupported<WriteFStoreNT>;
316 defm : X86WriteRes<WriteFStoreNTX, [SPRPort04_09, SPRPort07_08], 518, [1, 1], 2>;
317 defm : X86WriteRes<WriteFStoreNTY, [SPRPort04_09, SPRPort07_08], 542, [1, 1], 2>;
318 defm : X86WriteRes<WriteFStoreX, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
319 defm : X86WriteRes<WriteFStoreY, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
320 defm : SPRWriteResPair<WriteFTest, [SPRPort00], 3, [1]>;
321 defm : SPRWriteResPair<WriteFTestY, [SPRPort00], 5, [1], 1, 6>;
322 defm : SPRWriteResPair<WriteFVarBlend, [SPRPort00_01_05], 1, [1], 1, 7>;
323 defm : SPRWriteResPair<WriteFVarBlendY, [SPRPort00_01_05], 1, [1], 1, 8>;
324 defm : SPRWriteResPair<WriteFVarBlendZ, [SPRPort00_05], 1, [1], 1, 8>;
325 defm : SPRWriteResPair<WriteFVarShuffle, [SPRPort05], 1, [1], 1, 7>;
326 defm : SPRWriteResPair<WriteFVarShuffle256, [SPRPort05], 3, [1], 1, 8>;
327 defm : SPRWriteResPair<WriteFVarShuffleY, [SPRPort05], 1, [1], 1, 8>;
328 defm : SPRWriteResPair<WriteFVarShuffleZ, [SPRPort05], 1, [1], 1, 8>;
329 def : WriteRes<WriteFence, [SPRPort00_06]> {
332 defm : SPRWriteResPair<WriteIDiv16, [SPRPort00_01_05_06_10, SPRPort01], 16, [1, 3], 4, 4>;
333 defm : SPRWriteResPair<WriteIDiv32, [SPRPort00_01_05_06_10, SPRPort01], 15, [1, 3], 4, 4>;
334 defm : SPRWriteResPair<WriteIDiv64, [SPRPort01], 18, [3], 3>;
335 defm : X86WriteRes<WriteIDiv8, [SPRPort01], 17, [3], 3>;
336 defm : X86WriteRes<WriteIDiv8Ld, [SPRPort01], 22, [3], 3>;
337 defm : SPRWriteResPair<WriteIMul16, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01], 5, [2, 1, 1], 4>;
338 defm : SPRWriteResPair<WriteIMul16Imm, [SPRPort00_01_05_06_10, SPRPort01], 4, [1, 1], 2>;
339 defm : SPRWriteResPair<WriteIMul16Reg, [SPRPort01], 3, [1]>;
340 defm : SPRWriteResPair<WriteIMul32, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01], 4, [1, 1, 1], 3>;
341 defm : SPRWriteResPair<WriteIMul32Imm, [SPRPort01], 3, [1]>;
342 defm : SPRWriteResPair<WriteIMul32Reg, [SPRPort01], 3, [1]>;
343 defm : SPRWriteResPair<WriteIMul64, [SPRPort01, SPRPort05], 4, [1, 1], 2>;
344 defm : SPRWriteResPair<WriteIMul64Imm, [SPRPort01], 3, [1]>;
345 defm : SPRWriteResPair<WriteIMul64Reg, [SPRPort01], 3, [1]>;
346 defm : SPRWriteResPair<WriteIMul8, [SPRPort01], 3, [1]>;
347 def : WriteRes<WriteIMulH, []> {
350 def : WriteRes<WriteIMulHLd, []> {
353 defm : SPRWriteResPair<WriteJump, [SPRPort00_06], 1, [1]>;
354 def : WriteRes<WriteLAHFSAHF, [SPRPort00_06]> {
357 defm : X86WriteRes<WriteLDMXCSR, [SPRPort00, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11], 7, [1, 1, 1, 1], 4>;
358 def : WriteRes<WriteLEA, [SPRPort01]>;
359 defm : SPRWriteResPair<WriteLZCNT, [SPRPort01], 3, [1]>;
360 def : WriteRes<WriteLoad, [SPRPort02_03_11]> {
363 def : WriteRes<WriteMMXMOVMSK, [SPRPort00]> {
366 defm : SPRWriteResPair<WriteMPSAD, [SPRPort01_05, SPRPort05], 4, [1, 1], 2, 7>;
367 defm : SPRWriteResPair<WriteMPSADY, [SPRPort01_05, SPRPort05], 4, [1, 1], 2, 8>;
368 defm : SPRWriteResPair<WriteMULX32, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01], 4, [1, 1, 1], 2>;
369 defm : SPRWriteResPair<WriteMULX64, [SPRPort01, SPRPort05], 4, [1, 1]>;
370 def : WriteRes<WriteMicrocoded, [SPRPort00_01_05_06]> {
371 let Latency = SapphireRapidsModel.MaxLatency;
373 def : WriteRes<WriteMove, [SPRPort00]> {
376 defm : X86WriteRes<WriteNop, [], 1, [], 0>;
377 defm : X86WriteRes<WritePCmpEStrI, [SPRPort00, SPRPort00_01_05, SPRPort00_06, SPRPort01, SPRPort05], 16, [3, 2, 1, 1, 1], 8>;
378 defm : X86WriteRes<WritePCmpEStrILd, [SPRPort00, SPRPort00_01_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05], 31, [3, 1, 1, 1, 1, 1], 8>;
379 defm : X86WriteRes<WritePCmpEStrM, [SPRPort00, SPRPort00_01_05, SPRPort00_06, SPRPort01, SPRPort05], 16, [3, 3, 1, 1, 1], 9>;
380 defm : X86WriteRes<WritePCmpEStrMLd, [SPRPort00, SPRPort00_01_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05], 17, [3, 2, 1, 1, 1, 1], 9>;
381 defm : SPRWriteResPair<WritePCmpIStrI, [SPRPort00], 11, [3], 3, 20>;
382 defm : SPRWriteResPair<WritePCmpIStrM, [SPRPort00], 11, [3], 3>;
383 defm : SPRWriteResPair<WritePHAdd, [SPRPort00_05, SPRPort05], 3, [1, 2], 3, 8>;
384 defm : SPRWriteResPair<WritePHAddX, [SPRPort00_01_05, SPRPort01_05], 2, [1, 2], 3, 7>;
385 defm : SPRWriteResPair<WritePHAddY, [SPRPort00_01_05, SPRPort01_05], 2, [1, 2], 3, 8>;
386 defm : SPRWriteResPair<WritePHMINPOS, [SPRPort00], 4, [1], 1, 7>;
387 defm : SPRWriteResPair<WritePMULLD, [SPRPort00_01], 10, [2], 2, 8>;
388 defm : SPRWriteResPair<WritePMULLDY, [SPRPort00_01], 10, [2], 2, 8>;
389 defm : SPRWriteResPair<WritePMULLDZ, [SPRPort00], 10, [2], 2, 8>;
390 defm : SPRWriteResPair<WritePOPCNT, [SPRPort01], 3, [1]>;
391 defm : SPRWriteResPair<WritePSADBW, [SPRPort05], 3, [1], 1, 8>;
392 defm : SPRWriteResPair<WritePSADBWX, [SPRPort05], 3, [1], 1, 7>;
393 defm : SPRWriteResPair<WritePSADBWY, [SPRPort05], 3, [1], 1, 8>;
394 defm : SPRWriteResPair<WritePSADBWZ, [SPRPort05], 3, [1], 1, 8>;
395 defm : X86WriteRes<WriteRMW, [SPRPort02_03_11, SPRPort04_09, SPRPort07_08], 1, [1, 1, 1], 3>;
396 defm : X86WriteRes<WriteRotate, [SPRPort00_01_05_06_10, SPRPort00_06], 2, [1, 2], 3>;
397 defm : X86WriteRes<WriteRotateLd, [SPRPort00_01_05_06_10, SPRPort00_06], 12, [1, 2], 3>;
398 defm : X86WriteRes<WriteRotateCL, [SPRPort00_06], 2, [2], 2>;
399 defm : X86WriteRes<WriteRotateCLLd, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01], 19, [2, 3, 2], 7>;
400 defm : X86WriteRes<WriteSETCC, [SPRPort00_06], 2, [2], 2>;
401 defm : X86WriteRes<WriteSETCCStore, [SPRPort00_06, SPRPort04_09, SPRPort07_08], 13, [2, 1, 1], 4>;
402 defm : X86WriteRes<WriteSHDmrcl, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08], 12, [1, 1, 1, 1, 1, 1], 6>;
403 defm : X86WriteRes<WriteSHDmri, [SPRPort00_01_05_06_10, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08], 12, [1, 1, 1, 1, 1], 5>;
404 defm : X86WriteRes<WriteSHDrrcl, [SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01], 5, [1, 1, 1], 3>;
405 def : WriteRes<WriteSHDrri, [SPRPort01]> {
408 defm : X86WriteRes<WriteSTMXCSR, [SPRPort00, SPRPort00_06, SPRPort04_09, SPRPort07_08], 12, [1, 1, 1, 1], 4>;
409 def : WriteRes<WriteShift, [SPRPort00_06]>;
410 def : WriteRes<WriteShiftLd, [SPRPort00_06]> {
413 defm : X86WriteRes<WriteShiftCL, [SPRPort00_06], 2, [2], 2>;
414 defm : X86WriteRes<WriteShiftCLLd, [SPRPort00_06], 12, [2], 2>;
415 defm : SPRWriteResPair<WriteShuffle, [SPRPort05], 1, [1], 1, 8>;
416 defm : SPRWriteResPair<WriteShuffle256, [SPRPort05], 3, [1], 1, 8>;
417 defm : SPRWriteResPair<WriteShuffleX, [SPRPort01_05], 1, [1], 1, 7>;
418 defm : SPRWriteResPair<WriteShuffleY, [SPRPort01_05], 1, [1], 1, 8>;
419 defm : SPRWriteResPair<WriteShuffleZ, [SPRPort05], 3, [1], 1, 6>;
420 defm : X86WriteRes<WriteStore, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
421 defm : X86WriteRes<WriteStoreNT, [SPRPort04_09, SPRPort07_08], 512, [1, 1], 2>;
422 def : WriteRes<WriteSystem, [SPRPort00_01_05_06]> {
423 let Latency = SapphireRapidsModel.MaxLatency;
425 defm : SPRWriteResPair<WriteTZCNT, [SPRPort01], 3, [1]>;
426 defm : SPRWriteResPair<WriteVPMOV256, [SPRPort05], 3, [1], 1, 8>;
427 defm : SPRWriteResPair<WriteVarBlend, [SPRPort00_01_05], 1, [1], 1, 7>;
428 defm : SPRWriteResPair<WriteVarBlendY, [SPRPort00_01_05], 1, [1], 1, 8>;
429 defm : SPRWriteResPair<WriteVarBlendZ, [SPRPort00_05], 1, [1], 1, 8>;
430 defm : SPRWriteResPair<WriteVarShuffle, [SPRPort00, SPRPort05], 3, [1, 1], 2, 8>;
431 defm : X86WriteRes<WriteVarShuffle256, [SPRPort05], 6, [2], 2>;
432 defm : X86WriteRes<WriteVarShuffle256Ld, [SPRPort02_03_11, SPRPort05], 11, [1, 1], 2>;
433 defm : SPRWriteResPair<WriteVarShuffleX, [SPRPort01_05], 1, [1], 1, 7>;
434 defm : SPRWriteResPair<WriteVarShuffleY, [SPRPort01_05], 1, [1], 1, 8>;
435 defm : SPRWriteResPair<WriteVarShuffleZ, [SPRPort05], 3, [1], 1, 8>;
436 defm : SPRWriteResPair<WriteVarVecShift, [SPRPort00_01], 1, [1], 1, 7>;
437 defm : SPRWriteResPair<WriteVarVecShiftY, [SPRPort00_01], 1, [1], 1, 8>;
438 defm : SPRWriteResPair<WriteVarVecShiftZ, [SPRPort00], 1, [1], 1, 8>;
439 defm : SPRWriteResPair<WriteVecALU, [SPRPort00], 1, [1], 1, 8>;
440 defm : SPRWriteResPair<WriteVecALUX, [SPRPort00_01], 1, [1], 1, 7>;
441 defm : SPRWriteResPair<WriteVecALUY, [SPRPort00_01], 1, [1], 1, 8>;
442 def : WriteRes<WriteVecALUZ, [SPRPort05]> {
445 defm : X86WriteRes<WriteVecALUZLd, [SPRPort00, SPRPort02_03_11], 9, [1, 1], 2>;
446 defm : X86WriteRes<WriteVecExtract, [SPRPort00, SPRPort01_05], 4, [1, 1], 2>;
447 defm : X86WriteRes<WriteVecExtractSt, [SPRPort01_05, SPRPort04_09, SPRPort07_08], 19, [1, 1, 1], 3>;
448 defm : SPRWriteResPair<WriteVecIMul, [SPRPort00], 5, [1], 1, 8>;
449 defm : SPRWriteResPair<WriteVecIMulX, [SPRPort00_01], 5, [1], 1, 8>;
450 defm : SPRWriteResPair<WriteVecIMulY, [SPRPort00_01], 5, [1], 1, 8>;
451 defm : SPRWriteResPair<WriteVecIMulZ, [SPRPort00], 5, [1], 1, 8>;
452 defm : X86WriteRes<WriteVecInsert, [SPRPort01_05, SPRPort05], 4, [1, 1], 2>;
453 defm : X86WriteRes<WriteVecInsertLd, [SPRPort01_05, SPRPort02_03_11], 8, [1, 1], 2>;
454 def : WriteRes<WriteVecLoad, [SPRPort02_03_11]> {
457 def : WriteRes<WriteVecLoadNT, [SPRPort02_03_11]> {
460 def : WriteRes<WriteVecLoadNTY, [SPRPort02_03_11]> {
463 def : WriteRes<WriteVecLoadX, [SPRPort02_03_11]> {
466 def : WriteRes<WriteVecLoadY, [SPRPort02_03_11]> {
469 defm : SPRWriteResPair<WriteVecLogic, [SPRPort00_05], 1, [1], 1, 8>;
470 defm : SPRWriteResPair<WriteVecLogicX, [SPRPort00_01_05], 1, [1], 1, 7>;
471 defm : SPRWriteResPair<WriteVecLogicY, [SPRPort00_01_05], 1, [1], 1, 8>;
472 defm : SPRWriteResPair<WriteVecLogicZ, [SPRPort00_05], 1, [1], 1, 8>;
473 def : WriteRes<WriteVecMOVMSK, [SPRPort00]> {
476 def : WriteRes<WriteVecMOVMSKY, [SPRPort00]> {
479 defm : X86WriteRes<WriteVecMaskedGatherWriteback, [], 5, [], 0>;
480 defm : X86WriteRes<WriteVecMaskedLoad, [SPRPort00_01_05, SPRPort02_03_11], 8, [1, 1], 2>;
481 defm : X86WriteRes<WriteVecMaskedLoadY, [SPRPort00_01_05, SPRPort02_03_11], 9, [1, 1], 2>;
482 defm : X86WriteRes<WriteVecMaskedStore32, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
483 defm : X86WriteRes<WriteVecMaskedStore32Y, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
484 defm : X86WriteRes<WriteVecMaskedStore64, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
485 defm : X86WriteRes<WriteVecMaskedStore64Y, [SPRPort00, SPRPort04_09, SPRPort07_08], 14, [1, 1, 1], 3>;
486 def : WriteRes<WriteVecMove, [SPRPort00_05]>;
487 def : WriteRes<WriteVecMoveFromGpr, [SPRPort05]> {
490 def : WriteRes<WriteVecMoveToGpr, [SPRPort00]> {
493 defm : X86WriteRes<WriteVecMoveX, [], 1, [], 0>;
494 def : WriteRes<WriteVecMoveY, [SPRPort00_01_05]>;
495 def : WriteRes<WriteVecMoveZ, [SPRPort00_05]>;
496 defm : SPRWriteResPair<WriteVecShift, [SPRPort00], 1, [1], 1, 8>;
497 def : WriteRes<WriteVecShiftImm, [SPRPort00]>;
498 defm : SPRWriteResPair<WriteVecShiftImmX, [SPRPort00_01], 1, [1], 1, 7>;
499 defm : SPRWriteResPair<WriteVecShiftImmY, [SPRPort00_01], 1, [1], 1, 8>;
500 defm : SPRWriteResPair<WriteVecShiftImmZ, [SPRPort00], 1, [1], 1, 8>;
501 defm : X86WriteRes<WriteVecShiftX, [SPRPort00_01, SPRPort01_05], 2, [1, 1], 2>;
502 defm : X86WriteRes<WriteVecShiftXLd, [SPRPort00_01, SPRPort02_03_11], 8, [1, 1], 2>;
503 defm : X86WriteRes<WriteVecShiftY, [SPRPort00_01, SPRPort05], 4, [1, 1], 2>;
504 defm : X86WriteRes<WriteVecShiftYLd, [SPRPort00_01, SPRPort02_03_11], 9, [1, 1], 2>;
505 defm : X86WriteRes<WriteVecShiftZ, [SPRPort00, SPRPort05], 4, [1, 1], 2>;
506 defm : X86WriteRes<WriteVecShiftZLd, [SPRPort00, SPRPort02_03_11], 9, [1, 1], 2>;
507 defm : X86WriteRes<WriteVecStore, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
508 defm : X86WriteRes<WriteVecStoreNT, [SPRPort04_09, SPRPort07_08], 511, [1, 1], 2>;
509 defm : X86WriteRes<WriteVecStoreNTY, [SPRPort04_09, SPRPort07_08], 507, [1, 1], 2>;
510 defm : X86WriteRes<WriteVecStoreX, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
511 defm : X86WriteRes<WriteVecStoreY, [SPRPort04_09, SPRPort07_08], 12, [1, 1], 2>;
512 defm : SPRWriteResPair<WriteVecTest, [SPRPort00, SPRPort05], 4, [1, 1], 2>;
513 defm : SPRWriteResPair<WriteVecTestY, [SPRPort00, SPRPort05], 6, [1, 1], 2, 6>;
514 defm : X86WriteRes<WriteXCHG, [SPRPort00_01_05_06_10], 2, [3], 3>;
515 def : WriteRes<WriteZero, []>;
517 // Infered SchedWriteRes and InstRW definition.
519 def SPRWriteResGroup0 : SchedWriteRes<[SPRPort02_03, SPRPort02_03_11, SPRPort04, SPRPort04_09]> {
523 def : InstRW<[SPRWriteResGroup0], (instregex "^AA(D|N)D64mr$",
526 def SPRWriteResGroup1 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
527 let ReleaseAtCycles = [2, 1, 1, 1, 1];
531 def : InstRW<[SPRWriteResGroup1, ReadAfterLd, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^(ADC|SBB)(16|32|64)mr$")>;
533 def SPRWriteResGroup2 : SchedWriteRes<[SPRPort00_06, SPRPort02_03_11]> {
537 def : InstRW<[SPRWriteResGroup2], (instregex "^RORX(32|64)mi$")>;
538 def : InstRW<[SPRWriteResGroup2, ReadAfterLd, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^(ADC|SBB)(8|16|32|64)rm$",
539 "^AD(C|O)X(32|64)rm$")>;
541 def SPRWriteResGroup3 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
545 def : InstRW<[SPRWriteResGroup3], (instregex "^(ADC|SBB)8mi(8?)$")>;
547 def SPRWriteResGroup4 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
548 let ReleaseAtCycles = [2, 1, 1, 1, 1];
552 def : InstRW<[SPRWriteResGroup4, ReadAfterLd, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^(ADC|SBB)8mr$")>;
554 def SPRWriteResGroup5 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
558 def : InstRW<[SPRWriteResGroup5], (instregex "^CMP(8|16|32)mi$",
559 "^CMP(8|16|32|64)mi8$",
561 "^POP(16|32)r((mr)?)$")>;
562 def : InstRW<[SPRWriteResGroup5], (instrs CMP64mi32,
565 def : InstRW<[SPRWriteResGroup5, ReadAfterLd], (instregex "^(ADD|CMP|SUB)(8|16|32|64)rm$",
567 "^(X?)OR(8|16|32)rm$")>;
568 def : InstRW<[SPRWriteResGroup5, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^CMP(8|16|32|64)mr$")>;
570 def SPRWriteResGroup6 : SchedWriteRes<[]> {
573 def : InstRW<[SPRWriteResGroup6], (instregex "^(ADD|SUB)64ri8$",
575 "^MOV64rr((_REV)?)$",
576 "^VMOV(A|U)P(D|S)Zrr((_REV)?)$",
577 "^VMOVDQA(32|64)Z((256)?)rr((_REV)?)$",
578 "^VMOVDQ(A|U)Yrr((_REV)?)$",
579 "^VMOVDQU(8|16|32|64)Z((256)?)rr((_REV)?)$")>;
580 def : InstRW<[SPRWriteResGroup6], (instrs CLC,
583 def SPRWriteResGroup7 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
587 def : InstRW<[SPRWriteResGroup7], (instregex "^A(D|N)D8mi(8?)$",
592 def : InstRW<[SPRWriteResGroup7, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^A(D|N)D8mr$",
594 def : InstRW<[SPRWriteResGroup7, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instrs SUB8mr)>;
596 def SPRWriteResGroup8 : SchedWriteRes<[SPRPort01_05, SPRPort02_03_11]> {
600 def : InstRW<[SPRWriteResGroup8, ReadAfterVecXLd], (instregex "^(V?)(ADD|SUB)PSrm$",
602 "^V(ADD|SUB)PSZ128rm((b|k|bk|kz)?)$",
603 "^V(ADD|SUB)PSZ128rmbkz$")>;
605 def SPRWriteResGroup9 : SchedWriteRes<[SPRPort01_05]> {
608 def : InstRW<[SPRWriteResGroup9], (instregex "^(V?)(ADD|SUB)PSrr$",
611 "^V(ADD|SUB)PSZ(128|256)rr(k?)$",
612 "^VPMOV(S|Z)XBWZ128rrk(z?)$",
613 "^VPSHUFBZ(128|256)rrk(z?)$",
614 "^VPSHUF(H|L)WZ(128|256)rik(z?)$",
615 "^VPUNPCK(H|L)(BW|WD)Z(128|256)rrk(z?)$")>;
616 def : InstRW<[SPRWriteResGroup9], (instrs VADDSUBPSYrr)>;
618 def SPRWriteResGroup10 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
622 def : InstRW<[SPRWriteResGroup10], (instregex "^ADD_F(32|64)m$",
623 "^ILD_F(16|32|64)m$",
624 "^SUB(R?)_F(32|64)m$",
625 "^VPOPCNT(B|D|Q|W)Z128rm$",
626 "^VPOPCNT(D|Q)Z128rm(b|k|kz)$",
627 "^VPOPCNT(D|Q)Z128rmbk(z?)$")>;
628 def : InstRW<[SPRWriteResGroup10, ReadAfterVecXLd], (instregex "^(V?)PACK(S|U)S(DW|WB)rm$",
630 "^VFPCLASSP(D|H|S)Z128rmb$",
631 "^VPACK(S|U)S(DW|WB)Z128rm$",
632 "^VPACK(S|U)SDWZ128rmb$",
633 "^VPM(AX|IN)(S|U)QZ128rm((b|k|bk|kz)?)$",
634 "^VPM(AX|IN)(S|U)QZ128rmbkz$",
635 "^VPMULTISHIFTQBZ128rm(b?)$")>;
636 def : InstRW<[SPRWriteResGroup10, ReadAfterVecXLd], (instrs VFPCLASSPHZ128rm)>;
637 def : InstRW<[SPRWriteResGroup10, ReadAfterVecYLd], (instregex "^VFPCLASSP(D|H|S)Z((256)?)rm$",
638 "^VPERM(I|T)2(D|Q|PS)Z128rm((b|k|bk|kz)?)$",
639 "^VPERM(I|T)2(D|Q|PS)Z128rmbkz$",
640 "^VPERM(I|T)2PDZ128rm((b|k|bk|kz)?)$",
641 "^VPERM(I|T)2PDZ128rmbkz$")>;
642 def : InstRW<[SPRWriteResGroup10, ReadAfterVecYLd], (instrs VPERMBZ128rm)>;
644 def SPRWriteResGroup11 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
645 let ReleaseAtCycles = [1, 2];
649 def : InstRW<[SPRWriteResGroup11], (instregex "^ADD_FI(16|32)m$",
650 "^SUB(R?)_FI(16|32)m$")>;
651 def : InstRW<[SPRWriteResGroup11, ReadAfterVecXLd], (instrs SHA256MSG2rm)>;
652 def : InstRW<[SPRWriteResGroup11, ReadAfterVecYLd], (instregex "^VPEXPAND(B|W)Z(128|256)rmk(z?)$",
653 "^VPEXPAND(B|W)Zrmk(z?)$")>;
655 def SPRWriteResGroup12 : SchedWriteRes<[SPRPort05]> {
658 def : InstRW<[SPRWriteResGroup12], (instregex "^ADD_F(P?)rST0$",
660 "^(V?)PACK(S|U)S(DW|WB)rr$",
662 "^SUB(R?)_F(P?)rST0$",
664 "^VALIGN(D|Q)Z256rri((k|kz)?)$",
665 "^VCMPP(D|H|S)Z(128|256)rri(k?)$",
667 "^VCMPS(D|H|S)Zrr(b?)_Int(k?)$",
668 "^VFPCLASSP(D|H|S)Z(128|256)rr(k?)$",
669 "^VFPCLASSS(D|H|S)Zrr(k?)$",
670 "^VPACK(S|U)S(DW|WB)Yrr$",
671 "^VPACK(S|U)S(DW|WB)Z(128|256)rr$",
672 "^VPALIGNRZ(128|256)rrik(z?)$",
673 "^VPBROADCAST(B|W)Z128rrk(z?)$",
674 "^VPCMP(B|D|Q|W|UD|UQ|UW)Z(128|256)rri(k?)$",
675 "^VPCMP(EQ|GT)(B|D|Q|W)Z(128|256)rr(k?)$",
676 "^VPCMPUBZ(128|256)rri(k?)$",
677 "^VPERMBZ(128|256)rr$",
679 "^VPERM(D|Q)Z256rr((k|kz)?)$",
680 "^VPERM(D|Q)Zrrk(z?)$",
681 "^VPERM(I|T)2(D|Q)Z(128|256)rr((k|kz)?)$",
682 "^VPERM(I|T)2(D|Q)Zrr((k|kz)?)$",
683 "^VPM(AX|IN)(S|U)QZ(128|256)rr((k|kz)?)$",
684 "^VPMULTISHIFTQBZ(128|256)rr$",
685 "^VPOPCNT(B|D|Q|W)Z(128|256)rr$",
686 "^VPOPCNT(D|Q)Z(128|256)rrk(z?)$",
687 "^VPTEST(N?)M(B|D|Q|W)Z(128|256)rr(k?)$",
688 "^VPTEST(N?)M(B|D|Q|W)Zrr(k?)$")>;
689 def : InstRW<[SPRWriteResGroup12], (instrs ADD_FST0r,
693 def SPRWriteResGroup13 : SchedWriteRes<[SPRPort00_01_05_06_10]> {
696 def : InstRW<[SPRWriteResGroup13], (instregex "^AND(8|16|32|64)r(r|i8)$",
697 "^AND(8|16|32|64)rr_REV$",
698 "^(AND|TEST)(32|64)i32$",
699 "^(AND|TEST)(8|32)ri$",
700 "^(AND|TEST)64ri32$",
702 "^(X?)OR(8|16|32|64)r(r|i8)$",
703 "^(X?)OR(8|16|32|64)rr_REV$",
704 "^(X?)OR(32|64)i32$",
708 "^TEST(8|16|32|64)rr$")>;
709 def : InstRW<[SPRWriteResGroup13], (instrs XOR8rr_NOREX)>;
711 def SPRWriteResGroup14 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
715 def : InstRW<[SPRWriteResGroup14], (instregex "^TEST(8|16|32)mi$")>;
716 def : InstRW<[SPRWriteResGroup14], (instrs TEST64mi32)>;
717 def : InstRW<[SPRWriteResGroup14, ReadAfterLd], (instregex "^(X?)OR64rm$")>;
718 def : InstRW<[SPRWriteResGroup14, ReadAfterLd], (instrs AND64rm)>;
719 def : InstRW<[SPRWriteResGroup14, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^TEST(8|16|32|64)mr$")>;
721 def SPRWriteResGroup15 : SchedWriteRes<[SPRPort01_05_10, SPRPort02_03_11]> {
725 def : InstRW<[SPRWriteResGroup15, ReadAfterLd], (instregex "^ANDN(32|64)rm$")>;
727 def SPRWriteResGroup16 : SchedWriteRes<[SPRPort01_05_10]> {
730 def : InstRW<[SPRWriteResGroup16], (instregex "^ANDN(32|64)rr$")>;
732 def SPRWriteResGroup17 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11]> {
733 let ReleaseAtCycles = [5, 2, 1, 1];
737 def : InstRW<[SPRWriteResGroup17], (instrs BT64mr)>;
739 def SPRWriteResGroup18 : SchedWriteRes<[SPRPort01]> {
742 def : InstRW<[SPRWriteResGroup18], (instregex "^BT((C|R|S)?)64rr$",
743 "^P(DEP|EXT)(32|64)rr$")>;
745 def SPRWriteResGroup19 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
746 let ReleaseAtCycles = [4, 2, 1, 1, 1, 1];
748 let NumMicroOps = 10;
750 def : InstRW<[SPRWriteResGroup19], (instregex "^BT(C|R|S)64mr$")>;
752 def SPRWriteResGroup20 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
756 def : InstRW<[SPRWriteResGroup20], (instregex "^CALL(16|32|64)m((_NT)?)$")>;
758 def SPRWriteResGroup21 : SchedWriteRes<[SPRPort00_06, SPRPort04_09, SPRPort07_08]> {
762 def : InstRW<[SPRWriteResGroup21], (instregex "^CALL(16|32|64)r((_NT)?)$")>;
764 def SPRWriteResGroup22 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
768 def : InstRW<[SPRWriteResGroup22], (instrs CALL64pcrel32,
771 def SPRWriteResGroup23 : SchedWriteRes<[SPRPort01_05]>;
772 def : InstRW<[SPRWriteResGroup23], (instregex "^C(DQ|WD)E$",
773 "^(V?)MOVS(H|L)DUPrr$",
774 "^(V?)SHUFP(D|S)rri$",
775 "^VMOVS(H|L)DUPYrr$",
776 "^VMOVS(H|L)DUPZ(128|256)rr((k|kz)?)$",
777 "^VPMOVQDZ128rr((k|kz)?)$",
779 "^VSHUFP(D|S)Z(128|256)rri((k|kz)?)$")>;
780 def : InstRW<[SPRWriteResGroup23], (instrs CBW,
783 def SPRWriteResGroup24 : SchedWriteRes<[SPRPort00_06]>;
784 def : InstRW<[SPRWriteResGroup24], (instregex "^C(DQ|QO)$",
787 def SPRWriteResGroup25 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
791 def : InstRW<[SPRWriteResGroup25], (instrs CLD)>;
793 def SPRWriteResGroup26 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
797 def : InstRW<[SPRWriteResGroup26], (instrs CLDEMOTE)>;
799 def SPRWriteResGroup27 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort04_09, SPRPort07_08]> {
803 def : InstRW<[SPRWriteResGroup27], (instrs CLFLUSH)>;
805 def SPRWriteResGroup28 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
809 def : InstRW<[SPRWriteResGroup28], (instrs CLFLUSHOPT)>;
811 def SPRWriteResGroup29 : SchedWriteRes<[SPRPort00_06, SPRPort01]> {
812 let ReleaseAtCycles = [2, 1];
813 let Latency = SapphireRapidsModel.MaxLatency;
816 def : InstRW<[SPRWriteResGroup29], (instrs CLI)>;
818 def SPRWriteResGroup30 : SchedWriteRes<[SPRPort00_06, SPRPort01, SPRPort05]> {
819 let ReleaseAtCycles = [6, 1, 3];
820 let Latency = SapphireRapidsModel.MaxLatency;
821 let NumMicroOps = 10;
823 def : InstRW<[SPRWriteResGroup30], (instrs CLTS)>;
825 def SPRWriteResGroup31 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
829 def : InstRW<[SPRWriteResGroup31], (instregex "^MOV16o(16|32|64)a$")>;
830 def : InstRW<[SPRWriteResGroup31], (instrs CLWB)>;
832 def SPRWriteResGroup32 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
833 let ReleaseAtCycles = [5, 2];
837 def : InstRW<[SPRWriteResGroup32], (instregex "^CMPS(B|L|Q|W)$")>;
839 def SPRWriteResGroup33 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01_05, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
840 let ReleaseAtCycles = [2, 7, 6, 2, 1, 1, 2, 1];
842 let NumMicroOps = 22;
844 def : InstRW<[SPRWriteResGroup33], (instrs CMPXCHG16B)>;
846 def SPRWriteResGroup34 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
847 let ReleaseAtCycles = [4, 7, 2, 1, 1, 1];
849 let NumMicroOps = 16;
851 def : InstRW<[SPRWriteResGroup34], (instrs CMPXCHG8B)>;
853 def SPRWriteResGroup35 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
854 let ReleaseAtCycles = [1, 2, 1, 1, 1];
858 def : InstRW<[SPRWriteResGroup35], (instrs CMPXCHG8rm)>;
860 def SPRWriteResGroup36 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_06, SPRPort01, SPRPort04_09, SPRPort05, SPRPort07_08]> {
861 let ReleaseAtCycles = [2, 1, 10, 6, 1, 5, 1];
863 let NumMicroOps = 26;
865 def : InstRW<[SPRWriteResGroup36], (instrs CPUID)>;
867 def SPRWriteResGroup37 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
871 def : InstRW<[SPRWriteResGroup37], (instregex "^(V?)CVT(T?)PD2DQrm$",
872 "^VCVT(T?)PD2(U?)DQZ128rm((b|k|bk|kz)?)$",
873 "^VCVT(T?)PD2(U?)DQZ128rmbkz$",
874 "^VCVTPH2PSXZ128rm(b?)$",
875 "^VCVT(U?)QQ2PSZ128rm((b|k|bk|kz)?)$",
876 "^VCVT(U?)QQ2PSZ128rmbkz$")>;
877 def : InstRW<[SPRWriteResGroup37], (instrs CVTSI642SSrm)>;
878 def : InstRW<[SPRWriteResGroup37, ReadAfterVecLd], (instregex "^(V?)CVTSI642SSrm_Int$",
879 "^VCVT(U?)SI642SSZrm((_Int)?)$")>;
880 def : InstRW<[SPRWriteResGroup37, ReadAfterVecLd], (instrs VCVTSI642SSrm)>;
882 def SPRWriteResGroup38 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort02_03_11]> {
886 def : InstRW<[SPRWriteResGroup38], (instregex "^(V?)CVT(T?)SD2SIrm((_Int)?)$")>;
887 def : InstRW<[SPRWriteResGroup38, ReadAfterVecLd], (instregex "^VCVT(T?)SD2SIZrm$",
888 "^VCVT(T?)SD2(U?)SIZrm_Int$")>;
889 def : InstRW<[SPRWriteResGroup38, ReadAfterVecLd], (instrs VCVTTSD2USIZrm)>;
891 def SPRWriteResGroup39 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
895 def : InstRW<[SPRWriteResGroup39], (instregex "^VCVT(T?)PS2(U?)QQZ256rr((k|kz)?)$",
896 "^VCVT(U?)QQ2PSZ256rr((k|kz)?)$")>;
897 def : InstRW<[SPRWriteResGroup39, ReadInt2Fpu], (instrs CVTSI2SSrr)>;
898 def : InstRW<[SPRWriteResGroup39, ReadDefault, ReadInt2Fpu], (instregex "^(V?)CVTSI2SSrr_Int$",
899 "^VCVT(U?)SI2SSZrr$",
900 "^VCVT(U?)SI2SSZrr(b?)_Int$")>;
901 def : InstRW<[SPRWriteResGroup39, ReadDefault, ReadInt2Fpu], (instrs VCVTSI2SSrr)>;
903 def SPRWriteResGroup40 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
904 let ReleaseAtCycles = [1, 2];
908 def : InstRW<[SPRWriteResGroup40, ReadInt2Fpu], (instrs CVTSI642SSrr)>;
909 def : InstRW<[SPRWriteResGroup40, ReadDefault, ReadInt2Fpu], (instregex "^(V?)CVTSI642SSrr_Int$",
910 "^VCVT(U?)SI642SSZrr$",
911 "^VCVT(U?)SI642SSZrr(b?)_Int$")>;
912 def : InstRW<[SPRWriteResGroup40, ReadDefault, ReadInt2Fpu], (instrs VCVTSI642SSrr)>;
914 def SPRWriteResGroup41 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort05]> {
918 def : InstRW<[SPRWriteResGroup41], (instregex "^(V?)CVT(T?)SS2SI64rr_Int$",
919 "^VCVT(T?)SS2SI64Zrr$",
920 "^VCVT(T?)SS2(U?)SI64Zrr(b?)_Int$")>;
921 def : InstRW<[SPRWriteResGroup41], (instrs VCVTTSS2USI64Zrr)>;
922 def : InstRW<[SPRWriteResGroup41, ReadDefault], (instregex "^(V?)CVT(T?)SS2SI64rr$")>;
924 def SPRWriteResGroup42 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
928 def : InstRW<[SPRWriteResGroup42], (instregex "^J(E|R)CXZ$")>;
929 def : InstRW<[SPRWriteResGroup42], (instrs CWD)>;
931 def SPRWriteResGroup43 : SchedWriteRes<[SPRPort00_01_05_06]>;
932 def : InstRW<[SPRWriteResGroup43], (instregex "^(LD|ST)_Frr$",
935 def : InstRW<[SPRWriteResGroup43], (instrs DEC16r_alt,
940 def SPRWriteResGroup44 : SchedWriteRes<[SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
943 def : InstRW<[SPRWriteResGroup44], (instrs DEC32r_alt)>;
945 def SPRWriteResGroup45 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
949 def : InstRW<[SPRWriteResGroup45], (instregex "^DIVR_F(32|64)m$")>;
951 def SPRWriteResGroup46 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
955 def : InstRW<[SPRWriteResGroup46], (instregex "^DIVR_FI(16|32)m$")>;
957 def SPRWriteResGroup47 : SchedWriteRes<[SPRPort00]> {
960 def : InstRW<[SPRWriteResGroup47], (instregex "^DIVR_F(P?)rST0$")>;
961 def : InstRW<[SPRWriteResGroup47], (instrs DIVR_FST0r)>;
963 def SPRWriteResGroup48 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
967 def : InstRW<[SPRWriteResGroup48, ReadAfterVecLd], (instregex "^(V?)DIVSDrm$")>;
968 def : InstRW<[SPRWriteResGroup48, ReadAfterVecLd], (instrs VDIVSDZrm)>;
970 def SPRWriteResGroup49 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
974 def : InstRW<[SPRWriteResGroup49], (instregex "^DIV_F(32|64)m$")>;
975 def : InstRW<[SPRWriteResGroup49, ReadAfterVecLd], (instregex "^VSQRTSHZm_Int((k|kz)?)$")>;
976 def : InstRW<[SPRWriteResGroup49, ReadAfterVecLd], (instrs VSQRTSHZm)>;
978 def SPRWriteResGroup50 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
982 def : InstRW<[SPRWriteResGroup50], (instregex "^DIV_FI(16|32)m$")>;
984 def SPRWriteResGroup51 : SchedWriteRes<[SPRPort00]> {
987 def : InstRW<[SPRWriteResGroup51], (instregex "^DIV_F(P?)rST0$")>;
988 def : InstRW<[SPRWriteResGroup51], (instrs DIV_FST0r)>;
990 def SPRWriteResGroup52 : SchedWriteRes<[SPRPort04, SPRPort04_09]>;
991 def : InstRW<[SPRWriteResGroup52], (instregex "^ENQCMD(S?)(16|32|64)$",
994 def : InstRW<[SPRWriteResGroup52], (instrs PUSHF32)>;
996 def SPRWriteResGroup53 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
997 let ReleaseAtCycles = [2, 21, 2, 14, 4, 9, 5];
999 let NumMicroOps = 57;
1001 def : InstRW<[SPRWriteResGroup53], (instrs ENTER)>;
1003 def SPRWriteResGroup54 : SchedWriteRes<[SPRPort04_09, SPRPort05, SPRPort07_08]> {
1005 let NumMicroOps = 3;
1007 def : InstRW<[SPRWriteResGroup54], (instregex "^(V?)EXTRACTPSmr$",
1008 "^VPMOVQDZ((256)?)mr$")>;
1009 def : InstRW<[SPRWriteResGroup54], (instrs SMSW16m,
1012 def SPRWriteResGroup55 : SchedWriteRes<[SPRPort00, SPRPort05]> {
1014 let NumMicroOps = 2;
1016 def : InstRW<[SPRWriteResGroup55], (instregex "^(V?)EXTRACTPSrr$")>;
1017 def : InstRW<[SPRWriteResGroup55], (instrs MMX_PEXTRWrr,
1021 def SPRWriteResGroup56 : SchedWriteRes<[SPRPort02_03, SPRPort02_03_11, SPRPort04, SPRPort04_09, SPRPort06]> {
1023 let NumMicroOps = 5;
1025 def : InstRW<[SPRWriteResGroup56], (instrs FARCALL64m)>;
1027 def SPRWriteResGroup57 : SchedWriteRes<[SPRPort02_03_11, SPRPort06]> {
1029 let NumMicroOps = 2;
1031 def : InstRW<[SPRWriteResGroup57], (instrs FARJMP64m,
1034 def SPRWriteResGroup58 : SchedWriteRes<[SPRPort04, SPRPort04_09]> {
1035 let NumMicroOps = 2;
1037 def : InstRW<[SPRWriteResGroup58], (instregex "^(V?)MASKMOVDQU((64)?)$",
1038 "^ST_FP(32|64|80)m$")>;
1039 def : InstRW<[SPRWriteResGroup58], (instrs FBSTPm,
1042 def SPRWriteResGroup59 : SchedWriteRes<[SPRPort00_05]> {
1043 let ReleaseAtCycles = [2];
1045 let NumMicroOps = 2;
1047 def : InstRW<[SPRWriteResGroup59], (instrs FDECSTP)>;
1049 def SPRWriteResGroup60 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
1050 let ReleaseAtCycles = [1, 2];
1052 let NumMicroOps = 3;
1054 def : InstRW<[SPRWriteResGroup60], (instregex "^FICOM(P?)(16|32)m$")>;
1055 def : InstRW<[SPRWriteResGroup60, ReadAfterVecYLd], (instregex "^VEXPANDP(D|S)Z((256)?)rm((k|kz)?)$",
1056 "^VPEXPAND(B|D|Q|W)Z((256)?)rm$",
1057 "^VPEXPAND(D|Q)Z((256)?)rmk(z?)$")>;
1059 def SPRWriteResGroup61 : SchedWriteRes<[SPRPort00_05]>;
1060 def : InstRW<[SPRWriteResGroup61], (instregex "^MMX_P(ADD|SUB)(B|D|Q|W)rr$",
1061 "^VP(ADD|SUB)(B|D|Q|W)Zrr$",
1062 "^VP(ADD|SUB)(D|Q)Zrrk(z?)$",
1063 "^VPTERNLOG(D|Q)Zrri((k|kz)?)$")>;
1064 def : InstRW<[SPRWriteResGroup61], (instrs FINCSTP,
1067 def SPRWriteResGroup62 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11]> {
1069 let NumMicroOps = 3;
1071 def : InstRW<[SPRWriteResGroup62], (instrs FLDCW16m)>;
1073 def SPRWriteResGroup63 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort02_03, SPRPort02_03_11]> {
1074 let ReleaseAtCycles = [2, 5, 10, 39, 8];
1076 let NumMicroOps = 64;
1078 def : InstRW<[SPRWriteResGroup63], (instrs FLDENVm)>;
1080 def SPRWriteResGroup64 : SchedWriteRes<[SPRPort00_01_05_06]> {
1081 let ReleaseAtCycles = [4];
1083 let NumMicroOps = 4;
1085 def : InstRW<[SPRWriteResGroup64], (instrs FNCLEX)>;
1087 def SPRWriteResGroup65 : SchedWriteRes<[SPRPort00_01_05_06, SPRPort00_05, SPRPort05]> {
1088 let ReleaseAtCycles = [6, 3, 6];
1090 let NumMicroOps = 15;
1092 def : InstRW<[SPRWriteResGroup65], (instrs FNINIT)>;
1094 def SPRWriteResGroup66 : SchedWriteRes<[SPRPort04, SPRPort04_09, SPRPort06]> {
1096 let NumMicroOps = 3;
1098 def : InstRW<[SPRWriteResGroup66], (instrs FNSTCW16m)>;
1100 def SPRWriteResGroup67 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06]> {
1102 let NumMicroOps = 2;
1104 def : InstRW<[SPRWriteResGroup67], (instrs FNSTSW16r)>;
1106 def SPRWriteResGroup68 : SchedWriteRes<[SPRPort00, SPRPort04, SPRPort04_09]> {
1108 let NumMicroOps = 3;
1110 def : InstRW<[SPRWriteResGroup68], (instrs FNSTSWm)>;
1112 def SPRWriteResGroup69 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06, SPRPort00_06, SPRPort01, SPRPort04, SPRPort04_09, SPRPort05, SPRPort06]> {
1113 let ReleaseAtCycles = [9, 11, 21, 1, 30, 11, 16, 1];
1115 let NumMicroOps = 100;
1117 def : InstRW<[SPRWriteResGroup69], (instrs FSTENVm)>;
1119 def SPRWriteResGroup70 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort01_05, SPRPort02_03, SPRPort02_03_11, SPRPort06]> {
1120 let ReleaseAtCycles = [4, 1, 2, 1, 47, 33, 2];
1122 let NumMicroOps = 90;
1124 def : InstRW<[SPRWriteResGroup70], (instrs FXRSTOR)>;
1126 def SPRWriteResGroup71 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort01_05, SPRPort02_03, SPRPort02_03_11, SPRPort06]> {
1127 let ReleaseAtCycles = [4, 1, 2, 1, 45, 31, 4];
1129 let NumMicroOps = 88;
1131 def : InstRW<[SPRWriteResGroup71], (instrs FXRSTOR64)>;
1133 def SPRWriteResGroup72 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1134 let ReleaseAtCycles = [2, 5, 10, 10, 2, 38, 5, 38];
1135 let Latency = SapphireRapidsModel.MaxLatency;
1136 let NumMicroOps = 110;
1138 def : InstRW<[SPRWriteResGroup72], (instregex "^FXSAVE((64)?)$")>;
1140 def SPRWriteResGroup73 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
1142 let NumMicroOps = 2;
1144 def : InstRW<[SPRWriteResGroup73], (instregex "^VPLZCNT(D|Q)Z256rm((b|k|bk|kz)?)$",
1145 "^VPLZCNT(D|Q)Z256rmbkz$")>;
1146 def : InstRW<[SPRWriteResGroup73, ReadAfterVecXLd], (instregex "^(V?)GF2P8AFFINE((INV)?)QBrmi$",
1147 "^(V?)GF2P8MULBrm$",
1148 "^V(ADD|SUB)PHZ128rm((b|k|bk|kz)?)$",
1149 "^V(ADD|SUB)PHZ128rmbkz$",
1150 "^VGETEXPPHZ128m((b|k|bk|kz)?)$",
1151 "^VGETEXPSHZm((k|kz)?)$",
1152 "^VGETMANTPHZ128rm(bi|ik)$",
1153 "^VGETMANTPHZ128rmbik(z?)$",
1154 "^VGETMANTPHZ128rmi((kz)?)$",
1155 "^VGETMANTSHZrmi((k|kz)?)$",
1156 "^VGF2P8AFFINE((INV)?)QBZ128rm(b?)i$",
1157 "^VM(AX|IN)CPHZ128rm((b|k|bk|kz)?)$",
1158 "^VM(AX|IN)CPHZ128rmbkz$",
1159 "^VM(AX|IN|UL)PHZ128rm((b|k|bk|kz)?)$",
1160 "^VM(AX|IN|UL)PHZ128rmbkz$")>;
1161 def : InstRW<[SPRWriteResGroup73, ReadAfterVecXLd], (instrs VGETEXPPHZ128mbkz,
1163 def : InstRW<[SPRWriteResGroup73, ReadAfterVecLd], (instregex "^V(ADD|SUB)SHZrm$",
1164 "^V(ADD|SUB)SHZrm_Int((k|kz)?)$",
1165 "^VCVTSH2SSZrm((_Int)?)$",
1166 "^VM(AX|IN)CSHZrm$",
1167 "^VM(AX|IN|UL)SHZrm$",
1168 "^VM(AX|IN|UL)SHZrm_Int((k|kz)?)$")>;
1169 def : InstRW<[SPRWriteResGroup73, ReadAfterVecYLd], (instregex "^VGF2P8AFFINE((INV)?)QBYrmi$",
1170 "^VGF2P8AFFINE((INV)?)QBZ256rm(b?)i$",
1171 "^VGF2P8MULB(Y|Z256)rm$")>;
1172 def : InstRW<[SPRWriteResGroup73, ReadAfterVecXLd, ReadAfterVecXLd], (instregex "^VF(N?)M(ADD|SUB)(132|213|231)PHZ128m((b|k|bk|kz)?)$",
1173 "^VF(N?)M(ADD|SUB)(132|213|231)PHZ128mbkz$",
1174 "^VFMADDSUB(132|213|231)PHZ128m((b|k|bk|kz)?)$",
1175 "^VFMADDSUB(132|213|231)PHZ128mbkz$",
1176 "^VFMSUBADD(132|213|231)PHZ128m((b|k|bk|kz)?)$",
1177 "^VFMSUBADD(132|213|231)PHZ128mbkz$")>;
1178 def : InstRW<[SPRWriteResGroup73, ReadAfterVecLd, ReadAfterVecLd], (instregex "^VF(N?)M(ADD|SUB)(132|213|231)SHZm$",
1179 "^VF(N?)M(ADD|SUB)(132|213|231)SHZm_Int((k|kz)?)$")>;
1180 def : InstRW<[SPRWriteResGroup73, ReadAfterVecYLd, ReadAfterVecYLd], (instregex "^VPMADD52(H|L)UQZ256m((b|k|bk|kz)?)$",
1181 "^VPMADD52(H|L)UQZ256mbkz$")>;
1183 def SPRWriteResGroup74 : SchedWriteRes<[SPRPort00_01]> {
1186 def : InstRW<[SPRWriteResGroup74], (instregex "^(V?)GF2P8MULBrr$",
1187 "^V(ADD|SUB)PHZ(128|256)rr$",
1188 "^V(ADD|SUB)SHZrr$",
1189 "^V(ADD|SUB)SHZrr(b?)_Int$",
1190 "^VCVT(T?)PH2(U?)WZ(128|256)rr$",
1191 "^VCVTSH2SSZrr(b?)_Int$",
1192 "^VCVT(U?)W2PHZ(128|256)rr$",
1193 "^VF(N?)M(ADD|SUB)(132|213|231)PHZ(128|256)r$",
1194 "^VF(N?)M(ADD|SUB)(132|213|231)SHZr(b?)((_Int)?)$",
1195 "^VFMADDSUB(132|213|231)PHZ(128|256)r$",
1196 "^VFMSUBADD(132|213|231)PHZ(128|256)r$",
1197 "^VGETEXPPHZ(128|256)r$",
1198 "^VGETEXPSHZr(b?)$",
1199 "^VGETMANTPHZ(128|256)rri$",
1200 "^VGETMANTSHZrri(b?)$",
1201 "^VGF2P8MULBZ(128|256)rr$",
1202 "^VM(AX|IN)CPHZ(128|256)rr$",
1203 "^VM(AX|IN)CSHZrr$",
1204 "^VM(AX|IN|UL)PHZ(128|256)rr$",
1205 "^VM(AX|IN|UL)SHZrr$",
1206 "^VM(AX|IN|UL)SHZrr(b?)_Int$")>;
1207 def : InstRW<[SPRWriteResGroup74], (instrs VCVTSH2SSZrr,
1210 def SPRWriteResGroup75 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort05]> {
1211 let ReleaseAtCycles = [7, 5, 26, 19, 2, 7, 21];
1213 let NumMicroOps = 87;
1215 def : InstRW<[SPRWriteResGroup75], (instrs IN16ri)>;
1217 def SPRWriteResGroup76 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort05]> {
1218 let ReleaseAtCycles = [7, 1, 4, 26, 19, 3, 7, 20];
1220 let NumMicroOps = 87;
1222 def : InstRW<[SPRWriteResGroup76], (instrs IN16rr)>;
1224 def SPRWriteResGroup77 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort05]> {
1225 let ReleaseAtCycles = [7, 6, 28, 21, 2, 10, 20];
1227 let NumMicroOps = 94;
1229 def : InstRW<[SPRWriteResGroup77], (instrs IN32ri)>;
1231 def SPRWriteResGroup78 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort05]> {
1232 let ReleaseAtCycles = [7, 9, 28, 21, 2, 11, 21];
1233 let NumMicroOps = 99;
1235 def : InstRW<[SPRWriteResGroup78], (instrs IN32rr)>;
1237 def SPRWriteResGroup79 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort05]> {
1238 let ReleaseAtCycles = [7, 6, 25, 19, 2, 8, 20];
1240 let NumMicroOps = 87;
1242 def : InstRW<[SPRWriteResGroup79], (instrs IN8ri)>;
1244 def SPRWriteResGroup80 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort05]> {
1245 let ReleaseAtCycles = [7, 6, 25, 19, 2, 7, 20];
1247 let NumMicroOps = 86;
1249 def : InstRW<[SPRWriteResGroup80], (instrs IN8rr)>;
1251 def SPRWriteResGroup81 : SchedWriteRes<[SPRPort00_06]> {
1252 let NumMicroOps = 4;
1254 def : InstRW<[SPRWriteResGroup81], (instrs INC16r_alt)>;
1256 def SPRWriteResGroup82 : SchedWriteRes<[SPRPort02_03_11]> {
1259 def : InstRW<[SPRWriteResGroup82], (instregex "^LD_F(32|64|80)m$",
1260 "^(V?)MOV(D|SH|SL)DUPrm$",
1261 "^VBROADCASTSS((Z128)?)rm$",
1262 "^VMOV(D|SH|SL)DUPZ128rm$",
1263 "^VPBROADCAST(D|Q)((Z128)?)rm$")>;
1264 def : InstRW<[SPRWriteResGroup82], (instrs INC32r_alt,
1265 VBROADCASTI32X2Z128rm)>;
1267 def SPRWriteResGroup83 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1268 let ReleaseAtCycles = [7, 6, 24, 17, 8, 1, 19, 1];
1270 let NumMicroOps = 83;
1272 def : InstRW<[SPRWriteResGroup83], (instrs INSB)>;
1274 def SPRWriteResGroup84 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1275 let ReleaseAtCycles = [7, 1, 5, 1, 27, 17, 11, 1, 21, 1];
1277 let NumMicroOps = 92;
1279 def : InstRW<[SPRWriteResGroup84], (instrs INSL)>;
1281 def SPRWriteResGroup85 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1282 let ReleaseAtCycles = [7, 1, 4, 1, 25, 17, 1, 9, 1, 19, 1];
1284 let NumMicroOps = 86;
1286 def : InstRW<[SPRWriteResGroup85], (instrs INSW)>;
1288 def SPRWriteResGroup86 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1289 let ReleaseAtCycles = [5, 4, 8, 6, 2, 5, 7, 5];
1290 let Latency = SapphireRapidsModel.MaxLatency;
1291 let NumMicroOps = 42;
1293 def : InstRW<[SPRWriteResGroup86], (instrs INVLPG)>;
1295 def SPRWriteResGroup87 : SchedWriteRes<[SPRPort04, SPRPort04_09, SPRPort05]> {
1297 let NumMicroOps = 3;
1299 def : InstRW<[SPRWriteResGroup87], (instregex "^IST(T?)_FP(16|32|64)m$",
1300 "^IST_F(16|32)m$")>;
1302 def SPRWriteResGroup88 : SchedWriteRes<[SPRPort00_01_05_06, SPRPort00_06]> {
1304 let NumMicroOps = 2;
1306 def : InstRW<[SPRWriteResGroup88], (instrs JCXZ)>;
1308 def SPRWriteResGroup89 : SchedWriteRes<[SPRPort06]>;
1309 def : InstRW<[SPRWriteResGroup89], (instrs JMP64r_REX)>;
1311 def SPRWriteResGroup90 : SchedWriteRes<[]> {
1313 let NumMicroOps = 0;
1315 def : InstRW<[SPRWriteResGroup90], (instregex "^JMP_(1|4)$")>;
1316 def : InstRW<[SPRWriteResGroup90], (instrs VZEROUPPER)>;
1318 def SPRWriteResGroup91 : SchedWriteRes<[SPRPort05]> {
1321 def : InstRW<[SPRWriteResGroup91], (instregex "^KADD(B|D|Q|W)rr$",
1322 "^KSHIFT(LB|RD|RQ|RW)ri$",
1323 "^KSHIFT(LD|RB)ri$",
1325 "^KUNPCK(BW|DQ|WD)rr$")>;
1327 def SPRWriteResGroup92 : SchedWriteRes<[SPRPort00]>;
1328 def : InstRW<[SPRWriteResGroup92], (instregex "^KAND(B|D|Q|W|ND|NQ|NW)rr$",
1329 "^KMOV(B|D|Q|W)kk$",
1330 "^KNOT(B|D|Q|W)rr$",
1331 "^K((X|XN)?)OR(B|D|Q|W)rr$",
1333 "^VPABS(D|Q|W)Zrr$",
1334 "^VPABS(D|Q)Zrrk(z?)$",
1335 "^VPADD(U?)S(B|W)Zrr$",
1337 "^VPM(AX|IN)(SB|UD|UW)Zrr$",
1338 "^VPM(AX|IN)(SD|UB)Zrr$",
1339 "^VPM(AX|IN)(S|U)DZrrk(z?)$",
1340 "^VPM(AX|IN)SWZrr$",
1341 "^VPSH(L|R)D(D|Q|W)Zrri$",
1342 "^VPSH(L|R)DV(D|Q|W)Zr$",
1343 "^VPSH(L|R)DV(D|Q)Zrk(z?)$",
1344 "^VPSUB(U?)SWZrr$")>;
1345 def : InstRW<[SPRWriteResGroup92], (instrs KANDNBrr,
1348 def SPRWriteResGroup93 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
1350 let NumMicroOps = 2;
1352 def : InstRW<[SPRWriteResGroup93], (instregex "^KMOV(B|D|Q|W)km$")>;
1354 def SPRWriteResGroup94 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1356 let NumMicroOps = 2;
1358 def : InstRW<[SPRWriteResGroup94], (instregex "^MOV8m(i|r)$")>;
1359 def : InstRW<[SPRWriteResGroup94], (instrs KMOVBmk,
1362 def SPRWriteResGroup95 : SchedWriteRes<[SPRPort05]>;
1363 def : InstRW<[SPRWriteResGroup95], (instregex "^(V?)PALIGNRrri$",
1364 "^VALIGN(D|Q)Z128rri((k|kz)?)$",
1365 "^VBROADCASTSSZ128rr((k|kz)?)$",
1366 "^VPALIGNR(Y|Z)rri$",
1367 "^VPALIGNRZ(128|256)rri$",
1368 "^VPBROADCAST(B|D|Q|W)rr$",
1369 "^VPSHUF(D|HW|LW)Zri$",
1370 "^VPSHUFDZrik(z?)$",
1372 "^VPUNPCK(H|L)(BW|WD)Zrr$",
1373 "^VPUNPCK(H|L|LQ)DQZrr((k|kz)?)$",
1374 "^VPUNPCKHQDQZrr((k|kz)?)$")>;
1375 def : InstRW<[SPRWriteResGroup95], (instrs KMOVQkr,
1378 def SPRWriteResGroup96 : SchedWriteRes<[SPRPort00]> {
1381 def : InstRW<[SPRWriteResGroup96], (instregex "^K((OR)?)TEST(B|D|Q|W)rr$",
1382 "^VP(A|SU)BS(B|W)Zrrk(z?)$",
1383 "^VPADD(U?)S(B|W)Zrrk(z?)$",
1384 "^VPAVG(B|W)Zrrk(z?)$",
1385 "^VPM(AX|IN)(SB|UW)Zrrk(z?)$",
1386 "^VPM(AX|IN)(SW|UB)Zrrk(z?)$",
1387 "^VPSH(L|R)DVWZrk(z?)$",
1388 "^VPS(L|R)LVWZrrk(z?)$",
1389 "^VPS(L|R)LWZrik(z?)$",
1390 "^VPSRAVWZrrk(z?)$",
1392 "^VPSUBUS(B|W)Zrrk(z?)$")>;
1393 def : InstRW<[SPRWriteResGroup96], (instrs VMOVSDto64Zrr)>;
1395 def SPRWriteResGroup97 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
1396 let ReleaseAtCycles = [8, 2, 14, 3, 1];
1398 let NumMicroOps = 81;
1400 def : InstRW<[SPRWriteResGroup97], (instrs LAR16rm)>;
1402 def SPRWriteResGroup98 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
1403 let ReleaseAtCycles = [1, 3, 1, 8, 5, 1, 2, 1];
1405 let NumMicroOps = 22;
1407 def : InstRW<[SPRWriteResGroup98], (instrs LAR16rr)>;
1409 def SPRWriteResGroup99 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
1410 let ReleaseAtCycles = [1, 2, 2, 9, 5, 3, 1];
1412 let NumMicroOps = 85;
1414 def : InstRW<[SPRWriteResGroup99], (instrs LAR32rm)>;
1416 def SPRWriteResGroup100 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
1417 let ReleaseAtCycles = [1, 3, 1, 8, 5, 1, 2, 1];
1419 let NumMicroOps = 22;
1421 def : InstRW<[SPRWriteResGroup100], (instregex "^LAR(32|64)rr$")>;
1423 def SPRWriteResGroup101 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
1424 let ReleaseAtCycles = [1, 2, 2, 9, 5, 3, 1];
1426 let NumMicroOps = 87;
1428 def : InstRW<[SPRWriteResGroup101], (instrs LAR64rm)>;
1430 def SPRWriteResGroup102 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort01]> {
1432 let NumMicroOps = 2;
1434 def : InstRW<[SPRWriteResGroup102], (instrs LEA16r)>;
1436 def SPRWriteResGroup103 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
1437 let ReleaseAtCycles = [3, 1];
1439 let NumMicroOps = 4;
1441 def : InstRW<[SPRWriteResGroup103], (instregex "^LODS(B|W)$",
1442 "^SCAS(B|L|Q|W)$")>;
1443 def : InstRW<[SPRWriteResGroup103], (instrs LEAVE)>;
1445 def SPRWriteResGroup104 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
1446 let ReleaseAtCycles = [2, 1];
1448 let NumMicroOps = 3;
1450 def : InstRW<[SPRWriteResGroup104], (instrs LEAVE64)>;
1452 def SPRWriteResGroup105 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1453 let ReleaseAtCycles = [1, 2, 4, 3, 2, 1, 1];
1454 let Latency = SapphireRapidsModel.MaxLatency;
1455 let NumMicroOps = 14;
1457 def : InstRW<[SPRWriteResGroup105], (instrs LGDT64m)>;
1459 def SPRWriteResGroup106 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1460 let ReleaseAtCycles = [1, 1, 5, 3, 2, 1, 1];
1461 let Latency = SapphireRapidsModel.MaxLatency;
1462 let NumMicroOps = 14;
1464 def : InstRW<[SPRWriteResGroup106], (instrs LIDT64m)>;
1466 def SPRWriteResGroup107 : SchedWriteRes<[SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1467 let ReleaseAtCycles = [5, 3, 2, 1, 1];
1468 let Latency = SapphireRapidsModel.MaxLatency;
1469 let NumMicroOps = 12;
1471 def : InstRW<[SPRWriteResGroup107], (instrs LLDT16m)>;
1473 def SPRWriteResGroup108 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1474 let ReleaseAtCycles = [1, 4, 3, 1, 1, 1];
1475 let Latency = SapphireRapidsModel.MaxLatency;
1476 let NumMicroOps = 11;
1478 def : InstRW<[SPRWriteResGroup108], (instrs LLDT16r)>;
1480 def SPRWriteResGroup109 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1481 let ReleaseAtCycles = [1, 1, 2, 8, 3, 1, 2, 7, 2];
1482 let Latency = SapphireRapidsModel.MaxLatency;
1483 let NumMicroOps = 27;
1485 def : InstRW<[SPRWriteResGroup109], (instrs LMSW16m)>;
1487 def SPRWriteResGroup110 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1488 let ReleaseAtCycles = [5, 7, 1, 2, 5, 2];
1489 let Latency = SapphireRapidsModel.MaxLatency;
1490 let NumMicroOps = 22;
1492 def : InstRW<[SPRWriteResGroup110], (instrs LMSW16r)>;
1494 def SPRWriteResGroup111 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
1495 let ReleaseAtCycles = [2, 1];
1497 let NumMicroOps = 3;
1499 def : InstRW<[SPRWriteResGroup111], (instregex "^LODS(L|Q)$")>;
1501 def SPRWriteResGroup112 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
1502 let ReleaseAtCycles = [2, 4, 1];
1504 let NumMicroOps = 7;
1506 def : InstRW<[SPRWriteResGroup112], (instrs LOOP)>;
1508 def SPRWriteResGroup113 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
1509 let ReleaseAtCycles = [4, 6, 1];
1511 let NumMicroOps = 11;
1513 def : InstRW<[SPRWriteResGroup113], (instrs LOOPE)>;
1515 def SPRWriteResGroup114 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
1516 let ReleaseAtCycles = [4, 6, 1];
1518 let NumMicroOps = 11;
1520 def : InstRW<[SPRWriteResGroup114], (instrs LOOPNE)>;
1522 def SPRWriteResGroup115 : SchedWriteRes<[SPRPort02_03, SPRPort02_03_11, SPRPort06]> {
1524 let NumMicroOps = 3;
1526 def : InstRW<[SPRWriteResGroup115], (instrs LRET64)>;
1528 def SPRWriteResGroup116 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
1529 let ReleaseAtCycles = [1, 5, 3, 3, 1];
1531 let NumMicroOps = 13;
1533 def : InstRW<[SPRWriteResGroup116], (instregex "^LSL(16|32|64)rm$")>;
1535 def SPRWriteResGroup117 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
1536 let ReleaseAtCycles = [1, 4, 4, 3, 2, 1];
1538 let NumMicroOps = 15;
1540 def : InstRW<[SPRWriteResGroup117], (instregex "^LSL(16|32|64)rr$")>;
1542 def SPRWriteResGroup118 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
1544 let NumMicroOps = 3;
1546 def : InstRW<[SPRWriteResGroup118], (instregex "^MMX_CVT(T?)PD2PIrm$")>;
1548 def SPRWriteResGroup119 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
1550 let NumMicroOps = 2;
1552 def : InstRW<[SPRWriteResGroup119], (instregex "^MMX_CVT(T?)PD2PIrr$",
1553 "^VCVT(T?)PH2(U?)DQZ(128|256)rr$",
1554 "^VCVTP(H2PS|S2PH)XZ256rr$")>;
1556 def SPRWriteResGroup120 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
1558 let NumMicroOps = 2;
1560 def : InstRW<[SPRWriteResGroup120], (instregex "^VCVTP(H2PS|S2PH)XZ128rr$",
1561 "^VPERMWZ(128|256)rrk(z?)$",
1562 "^VPS(L|R)LWZ256rrk(z?)$",
1563 "^VPSRAWZ256rrk(z?)$")>;
1564 def : InstRW<[SPRWriteResGroup120], (instrs MMX_CVTPI2PDrr)>;
1566 def SPRWriteResGroup121 : SchedWriteRes<[SPRPort00, SPRPort00_01]> {
1568 let NumMicroOps = 2;
1570 def : InstRW<[SPRWriteResGroup121], (instrs MMX_CVTPI2PSrr)>;
1572 def SPRWriteResGroup122 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
1574 let NumMicroOps = 2;
1576 def : InstRW<[SPRWriteResGroup122], (instregex "^MMX_CVT(T?)PS2PIrm$")>;
1578 def SPRWriteResGroup123 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
1580 let NumMicroOps = 2;
1582 def : InstRW<[SPRWriteResGroup123], (instregex "^MMX_CVT(T?)PS2PIrr$")>;
1584 def SPRWriteResGroup124 : SchedWriteRes<[SPRPort00, SPRPort04_09, SPRPort07_08]> {
1585 let ReleaseAtCycles = [2, 1, 1];
1587 let NumMicroOps = 4;
1589 def : InstRW<[SPRWriteResGroup124], (instregex "^MMX_MASKMOVQ((64)?)$")>;
1591 def SPRWriteResGroup125 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1593 let NumMicroOps = 2;
1595 def : InstRW<[SPRWriteResGroup125], (instregex "^VMOV(W|SHZ)mr$")>;
1596 def : InstRW<[SPRWriteResGroup125], (instrs MMX_MOVD64mr)>;
1598 def SPRWriteResGroup126 : SchedWriteRes<[SPRPort02_03_11]> {
1601 def : InstRW<[SPRWriteResGroup126], (instregex "^MMX_MOV(D|Q)64rm$",
1602 "^VBROADCAST(F|I)128rm$",
1603 "^VBROADCAST(F|I)32X(2|4)Z256rm$",
1604 "^VBROADCAST(F|I)32X(8|2Z)rm$",
1605 "^VBROADCAST(F|I)(32|64)X4rm$",
1606 "^VBROADCAST(F|I)64X2((Z128)?)rm$",
1607 "^VBROADCASTS(DY|SZ)rm$",
1608 "^VBROADCASTS(D|S)Z256rm$",
1609 "^VBROADCASTS(DZ|SY)rm$",
1610 "^VMOV(D|SH|SL)DUP(Y|Z)rm$",
1611 "^VMOV(D|SH|SL)DUPZ256rm$",
1612 "^VPBROADCAST(DY|QZ)rm$",
1613 "^VPBROADCAST(D|Q)Z256rm$",
1614 "^VPBROADCAST(DZ|QY)rm$")>;
1615 def : InstRW<[SPRWriteResGroup126], (instrs MMX_MOVD64to64rm)>;
1617 def SPRWriteResGroup127 : SchedWriteRes<[SPRPort00_01_05, SPRPort00_05]> {
1619 let NumMicroOps = 2;
1621 def : InstRW<[SPRWriteResGroup127], (instregex "^MMX_MOV(DQ|FR64)2Qrr$")>;
1623 def SPRWriteResGroup128 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
1625 let NumMicroOps = 2;
1627 def : InstRW<[SPRWriteResGroup128], (instregex "^MMX_MOVQ2(DQ|FR64)rr$")>;
1629 def SPRWriteResGroup129 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
1630 let ReleaseAtCycles = [1, 2];
1632 let NumMicroOps = 3;
1634 def : InstRW<[SPRWriteResGroup129, ReadAfterVecLd], (instregex "^MMX_PACKSS(DW|WB)rm$")>;
1635 def : InstRW<[SPRWriteResGroup129, ReadAfterVecLd], (instrs MMX_PACKUSWBrm)>;
1637 def SPRWriteResGroup130 : SchedWriteRes<[SPRPort05]> {
1638 let ReleaseAtCycles = [2];
1640 let NumMicroOps = 2;
1642 def : InstRW<[SPRWriteResGroup130], (instregex "^MMX_PACKSS(DW|WB)rr$",
1643 "^VPMOV(D|Q|W|SQ|SW)BZrr$",
1644 "^VPMOV((S|US)?)(D|Q)WZrr$",
1645 "^VPMOV(U?)S(DB|QD)Zrr$",
1646 "^VPMOV(U?)SQDZrrk(z?)$",
1647 "^VPMOVUS(Q|W)BZrr$")>;
1648 def : InstRW<[SPRWriteResGroup130], (instrs MMX_PACKUSWBrr)>;
1649 def : InstRW<[SPRWriteResGroup130, ReadDefault, ReadInt2Fpu], (instrs MMX_PINSRWrr)>;
1651 def SPRWriteResGroup131 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11]> {
1653 let NumMicroOps = 2;
1655 def : InstRW<[SPRWriteResGroup131], (instregex "^VBROADCAST(F|I)32X(8|2Z)rmk(z?)$",
1656 "^VBROADCAST(F|I)(32|64)X4rmk(z?)$",
1657 "^VBROADCAST(F|I)64X2rmk(z?)$",
1658 "^VBROADCASTS(D|S)Zrmk(z?)$",
1659 "^VMOV(A|U)P(D|S)Zrmk(z?)$",
1660 "^VMOV(D|SH|SL)DUPZrmk(z?)$",
1661 "^VMOVDQ(A|U)(32|64)Zrmk(z?)$",
1662 "^VPBROADCAST(D|Q)Zrmk(z?)$")>;
1663 def : InstRW<[SPRWriteResGroup131, ReadAfterVecLd], (instregex "^MMX_P(ADD|SUB)(B|D|Q|W)rm$")>;
1664 def : InstRW<[SPRWriteResGroup131, ReadAfterVecYLd], (instregex "^VINSERT(F|I)(32|64)x4Zrm((k|kz)?)$",
1665 "^VINSERT(F|I)(32x8|64x2)Zrm((k|kz)?)$",
1666 "^VP(ADD|SUB)(B|D|Q|W)Zrm$",
1667 "^VP(ADD|SUB)(D|Q)Zrm(b|k|kz)$",
1668 "^VP(ADD|SUB)(D|Q)Zrmbk(z?)$",
1669 "^VPTERNLOG(D|Q)Zrm(bi|ik)$",
1670 "^VPTERNLOG(D|Q)Zrmbik(z?)$",
1671 "^VPTERNLOG(D|Q)Zrmi((kz)?)$")>;
1673 def SPRWriteResGroup132 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
1674 let ReleaseAtCycles = [1, 1, 2];
1676 let NumMicroOps = 4;
1678 def : InstRW<[SPRWriteResGroup132, ReadAfterVecLd], (instregex "^MMX_PH(ADD|SUB)SWrm$")>;
1680 def SPRWriteResGroup133 : SchedWriteRes<[SPRPort00, SPRPort05]> {
1681 let ReleaseAtCycles = [1, 2];
1683 let NumMicroOps = 3;
1685 def : InstRW<[SPRWriteResGroup133], (instregex "^MMX_PH(ADD|SUB)SWrr$")>;
1687 def SPRWriteResGroup134 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
1689 let NumMicroOps = 2;
1691 def : InstRW<[SPRWriteResGroup134], (instregex "^VPBROADCAST(BY|WZ)rm$",
1692 "^VPBROADCAST(B|W)Z256rm$",
1693 "^VPBROADCAST(BZ|WY)rm$")>;
1694 def : InstRW<[SPRWriteResGroup134, ReadAfterLd], (instrs MMX_PINSRWrm)>;
1695 def : InstRW<[SPRWriteResGroup134, ReadAfterVecXLd], (instregex "^VFPCLASSP(D|S)Z128rm$")>;
1696 def : InstRW<[SPRWriteResGroup134, ReadAfterVecLd], (instregex "^VFPCLASSS(D|H|S)Zrm$")>;
1697 def : InstRW<[SPRWriteResGroup134, ReadAfterVecYLd], (instregex "^VPALIGNR(Y|Z256)rmi$")>;
1698 def : InstRW<[SPRWriteResGroup134, ReadAfterVecYLd], (instrs VPSHUFBZrm)>;
1700 def SPRWriteResGroup135 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
1702 let NumMicroOps = 2;
1704 def : InstRW<[SPRWriteResGroup135], (instregex "^MOV16ao(16|32|64)$")>;
1706 def SPRWriteResGroup136 : SchedWriteRes<[SPRPort01, SPRPort04_09, SPRPort07_08]> {
1708 let NumMicroOps = 3;
1710 def : InstRW<[SPRWriteResGroup136], (instregex "^PUSH(F|G)S(16|32)$")>;
1711 def : InstRW<[SPRWriteResGroup136], (instrs MOV16ms,
1714 def SPRWriteResGroup137 : SchedWriteRes<[SPRPort00_01_05_06_10]>;
1715 def : InstRW<[SPRWriteResGroup137], (instregex "^MOV(8|16|32|64)ri$",
1716 "^MOV(8|16|32)ri_alt$",
1717 "^MOV(8|16)rr((_REV)?)$")>;
1718 def : InstRW<[SPRWriteResGroup137], (instrs MOV64ri32,
1721 def SPRWriteResGroup138 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort01]> {
1722 let NumMicroOps = 2;
1724 def : InstRW<[SPRWriteResGroup138], (instregex "^MOV(16|32|64)rs$",
1727 def SPRWriteResGroup139 : SchedWriteRes<[SPRPort02_03_11]>;
1728 def : InstRW<[SPRWriteResGroup139], (instregex "^MOV32ao(16|32|64)$")>;
1729 def : InstRW<[SPRWriteResGroup139], (instrs MOV64ao64)>;
1731 def SPRWriteResGroup140 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
1732 let NumMicroOps = 3;
1734 def : InstRW<[SPRWriteResGroup140], (instregex "^MOV(8|32)o(16|32)a$",
1735 "^MOV(8|32|64)o64a$")>;
1737 def SPRWriteResGroup141 : SchedWriteRes<[SPRPort00_01_05_06_10]> {
1740 def : InstRW<[SPRWriteResGroup141], (instregex "^MOV32rr((_REV)?)$",
1741 "^MOVZX(32|64)rr8$")>;
1742 def : InstRW<[SPRWriteResGroup141], (instrs MOVZX32rr8_NOREX)>;
1744 def SPRWriteResGroup142 : SchedWriteRes<[SPRPort02_03_11]> {
1747 def : InstRW<[SPRWriteResGroup142], (instrs MOV64ao32)>;
1749 def SPRWriteResGroup143 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1750 let ReleaseAtCycles = [1, 2, 4, 16, 7, 2, 2, 12, 2];
1752 let NumMicroOps = 48;
1754 def : InstRW<[SPRWriteResGroup143], (instrs MOV64dr)>;
1756 def SPRWriteResGroup144 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1758 let NumMicroOps = 2;
1760 def : InstRW<[SPRWriteResGroup144], (instrs MOV64o32a)>;
1762 def SPRWriteResGroup145 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort05]> {
1763 let Latency = SapphireRapidsModel.MaxLatency;
1764 let NumMicroOps = 3;
1766 def : InstRW<[SPRWriteResGroup145], (instrs MOV64rc)>;
1768 def SPRWriteResGroup146 : SchedWriteRes<[SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort05]> {
1769 let ReleaseAtCycles = [3, 4, 8, 4, 2, 3];
1771 let NumMicroOps = 24;
1773 def : InstRW<[SPRWriteResGroup146], (instrs MOV64rd)>;
1775 def SPRWriteResGroup147 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
1776 let NumMicroOps = 2;
1778 def : InstRW<[SPRWriteResGroup147], (instregex "^MOV8ao(16|32|64)$")>;
1780 def SPRWriteResGroup148 : SchedWriteRes<[SPRPort00_06, SPRPort04_09, SPRPort07_08]> {
1782 let NumMicroOps = 3;
1784 def : InstRW<[SPRWriteResGroup148], (instrs MOVBE16mr)>;
1786 def SPRWriteResGroup149 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort02_03_11]> {
1788 let NumMicroOps = 3;
1790 def : InstRW<[SPRWriteResGroup149], (instrs MOVBE16rm)>;
1792 def SPRWriteResGroup150 : SchedWriteRes<[SPRPort01, SPRPort02_03_11]> {
1794 let NumMicroOps = 2;
1796 def : InstRW<[SPRWriteResGroup150], (instrs MOVBE32rm)>;
1798 def SPRWriteResGroup151 : SchedWriteRes<[SPRPort00_06, SPRPort01, SPRPort04_09, SPRPort07_08]> {
1800 let NumMicroOps = 4;
1802 def : InstRW<[SPRWriteResGroup151], (instrs MOVBE64mr,
1807 def SPRWriteResGroup152 : SchedWriteRes<[SPRPort00_06, SPRPort01, SPRPort02_03_11]> {
1809 let NumMicroOps = 3;
1811 def : InstRW<[SPRWriteResGroup152], (instrs MOVBE64rm)>;
1813 def SPRWriteResGroup153 : SchedWriteRes<[SPRPort00_06, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1814 let NumMicroOps = 4;
1816 def : InstRW<[SPRWriteResGroup153], (instregex "^MOVDIR64B(16|32|64)$")>;
1818 def SPRWriteResGroup154 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1820 let NumMicroOps = 2;
1822 def : InstRW<[SPRWriteResGroup154], (instrs MOVDIRI32)>;
1824 def SPRWriteResGroup155 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1826 let NumMicroOps = 2;
1828 def : InstRW<[SPRWriteResGroup155], (instrs MOVDIRI64)>;
1830 def SPRWriteResGroup156 : SchedWriteRes<[SPRPort01_05, SPRPort02_03_11]> {
1832 let NumMicroOps = 2;
1834 def : InstRW<[SPRWriteResGroup156, ReadAfterVecXLd], (instregex "^(V?)MOVLP(D|S)rm$",
1835 "^(V?)SHUFP(D|S)rmi$",
1836 "^VMOVLP(D|S)Z128rm$",
1837 "^VSHUFP(D|S)Z128rm(bi|ik)$",
1838 "^VSHUFP(D|S)Z128rmbik(z?)$",
1839 "^VSHUFP(D|S)Z128rmi((kz)?)$")>;
1841 def SPRWriteResGroup157 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1843 let NumMicroOps = 2;
1845 def : InstRW<[SPRWriteResGroup157], (instrs MOVNTDQmr)>;
1847 def SPRWriteResGroup158 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
1849 let NumMicroOps = 2;
1851 def : InstRW<[SPRWriteResGroup158], (instrs MOVNTImr)>;
1853 def SPRWriteResGroup159 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1854 let ReleaseAtCycles = [4, 1, 1, 1];
1856 let NumMicroOps = 7;
1858 def : InstRW<[SPRWriteResGroup159], (instrs MOVSB)>;
1860 def SPRWriteResGroup160 : SchedWriteRes<[SPRPort00_01_05]>;
1861 def : InstRW<[SPRWriteResGroup160], (instregex "^(V?)MOVS(D|S)rr((_REV)?)$",
1862 "^(V?)P(ADD|SUB)(B|D|Q|W)rr$",
1863 "^VMOV(A|U)P(D|S)Z(128|256)rrk(z?)((_REV)?)$",
1864 "^VMOVDQ(A|U)(32|64)Z128rrk(z?)((_REV)?)$",
1865 "^VMOVS(D|H|S)Zrr((_REV)?)$",
1866 "^VMOVS(D|S)Zrrk(z?)((_REV)?)$",
1867 "^VP(ADD|SUB)(B|D|Q|W)Yrr$",
1868 "^VP(ADD|SUB)(B|D|Q|W)Z(128|256)rr$",
1869 "^VP(ADD|SUB)(D|Q)Z(128|256)rrk(z?)$",
1870 "^VPMOVM2(D|Q)Z128rr$",
1871 "^VPTERNLOG(D|Q)Z(128|256)rri((k|kz)?)$")>;
1872 def : InstRW<[SPRWriteResGroup160], (instrs VPBLENDDrri)>;
1874 def SPRWriteResGroup161 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
1875 let ReleaseAtCycles = [4, 1, 1, 1];
1877 let NumMicroOps = 7;
1879 def : InstRW<[SPRWriteResGroup161], (instregex "^MOVS(L|Q|W)$")>;
1881 def SPRWriteResGroup162 : SchedWriteRes<[SPRPort02_03_11]> {
1884 def : InstRW<[SPRWriteResGroup162], (instregex "^MOVSX(16|32|64)rm(16|32)$",
1885 "^MOVSX(32|64)rm8$")>;
1886 def : InstRW<[SPRWriteResGroup162], (instrs MOVSX32rm8_NOREX)>;
1888 def SPRWriteResGroup163 : SchedWriteRes<[SPRPort01_05_10, SPRPort02_03_11]> {
1890 let NumMicroOps = 2;
1892 def : InstRW<[SPRWriteResGroup163], (instrs MOVSX16rm8)>;
1894 def SPRWriteResGroup164 : SchedWriteRes<[SPRPort01_05_10]>;
1895 def : InstRW<[SPRWriteResGroup164], (instregex "^MOVSX(16|32|64)rr(8|16|32)$")>;
1896 def : InstRW<[SPRWriteResGroup164], (instrs MOVSX32rr8_NOREX)>;
1898 def SPRWriteResGroup165 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
1900 let NumMicroOps = 2;
1902 def : InstRW<[SPRWriteResGroup165], (instregex "^MUL_F(32|64)m$",
1903 "^VPABS(B|W)Zrmk(z?)$",
1904 "^VPS(L|R)LWZmik(z?)$",
1905 "^VPSRAWZmik(z?)$")>;
1906 def : InstRW<[SPRWriteResGroup165, ReadAfterVecYLd], (instregex "^VP(ADD|SUB)(U?)S(B|W)Zrmk(z?)$",
1907 "^VPAVG(B|W)Zrmk(z?)$",
1908 "^VPM(AX|IN)(SB|UW)Zrmk(z?)$",
1909 "^VPM(AX|IN)(SW|UB)Zrmk(z?)$",
1910 "^VPSH(L|R)DVWZmk(z?)$",
1911 "^VPS(L|R)L(V?)WZrmk(z?)$",
1912 "^VPSRA(V?)WZrmk(z?)$")>;
1914 def SPRWriteResGroup166 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
1916 let NumMicroOps = 3;
1918 def : InstRW<[SPRWriteResGroup166], (instregex "^MUL_FI(16|32)m$")>;
1920 def SPRWriteResGroup167 : SchedWriteRes<[SPRPort00]> {
1923 def : InstRW<[SPRWriteResGroup167], (instregex "^MUL_F(P?)rST0$",
1924 "^V(U?)COMISHZrr(b?)$",
1925 "^V(U?)COMISHZrr_Int$",
1926 "^VCVT(T?)PD2(U?)QQZrr((b|k|bk|kz)?)$",
1927 "^VCVT(T?)PD2(U?)QQZrrbkz$",
1928 "^VCVT(T?)PS2(U?)DQZrr((b|k|bk|kz)?)$",
1929 "^VCVT(T?)PS2(U?)DQZrrbkz$",
1930 "^VM(AX|IN)(C?)PSZrr((k|kz)?)$",
1931 "^VM(AX|IN)PSZrrb((k|kz)?)$",
1932 "^VPLZCNT(D|Q)Zrr((k|kz)?)$",
1933 "^VPMADD52(H|L)UQZr((k|kz)?)$")>;
1934 def : InstRW<[SPRWriteResGroup167], (instrs MUL_FST0r)>;
1936 def SPRWriteResGroup168 : SchedWriteRes<[SPRPort00_01_05_06, SPRPort05, SPRPort06]> {
1937 let ReleaseAtCycles = [7, 1, 2];
1939 let NumMicroOps = 10;
1941 def : InstRW<[SPRWriteResGroup168], (instrs MWAITrr)>;
1943 def SPRWriteResGroup169 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1944 let ReleaseAtCycles = [6, 4, 1, 28, 15, 7, 1, 16, 1];
1946 let NumMicroOps = 79;
1948 def : InstRW<[SPRWriteResGroup169], (instrs OUT16ir)>;
1950 def SPRWriteResGroup170 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1951 let ReleaseAtCycles = [6, 6, 27, 15, 7, 1, 16, 1];
1953 let NumMicroOps = 79;
1955 def : InstRW<[SPRWriteResGroup170], (instrs OUT16rr)>;
1957 def SPRWriteResGroup171 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1958 let ReleaseAtCycles = [6, 4, 1, 30, 15, 9, 1, 18, 1];
1960 let NumMicroOps = 85;
1962 def : InstRW<[SPRWriteResGroup171], (instrs OUT32ir)>;
1964 def SPRWriteResGroup172 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1965 let ReleaseAtCycles = [6, 6, 29, 15, 9, 1, 18, 1];
1967 let NumMicroOps = 85;
1969 def : InstRW<[SPRWriteResGroup172], (instrs OUT32rr)>;
1971 def SPRWriteResGroup173 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1972 let ReleaseAtCycles = [5, 5, 1, 25, 15, 5, 1, 15, 1];
1974 let NumMicroOps = 73;
1976 def : InstRW<[SPRWriteResGroup173], (instrs OUT8ir)>;
1978 def SPRWriteResGroup174 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1979 let ReleaseAtCycles = [5, 5, 26, 15, 5, 1, 15, 1];
1981 let NumMicroOps = 73;
1983 def : InstRW<[SPRWriteResGroup174], (instrs OUT8rr)>;
1985 def SPRWriteResGroup175 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1986 let ReleaseAtCycles = [7, 6, 25, 16, 7, 1, 17, 1];
1987 let Latency = SapphireRapidsModel.MaxLatency;
1988 let NumMicroOps = 80;
1990 def : InstRW<[SPRWriteResGroup175], (instrs OUTSB)>;
1992 def SPRWriteResGroup176 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
1993 let ReleaseAtCycles = [7, 6, 28, 16, 10, 1, 20, 1];
1994 let Latency = SapphireRapidsModel.MaxLatency;
1995 let NumMicroOps = 89;
1997 def : InstRW<[SPRWriteResGroup176], (instrs OUTSL)>;
1999 def SPRWriteResGroup177 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
2000 let ReleaseAtCycles = [6, 1, 5, 27, 16, 8, 1, 18, 1];
2001 let Latency = SapphireRapidsModel.MaxLatency;
2002 let NumMicroOps = 83;
2004 def : InstRW<[SPRWriteResGroup177], (instrs OUTSW)>;
2006 def SPRWriteResGroup178 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11]> {
2008 let NumMicroOps = 2;
2010 def : InstRW<[SPRWriteResGroup178], (instregex "^VBROADCASTI32X2Z128rmk(z?)$",
2011 "^VBROADCASTSSZ128rmk(z?)$",
2012 "^VMOV(A|U)P(D|S)Z128rmk(z?)$",
2013 "^VMOV(D|SH|SL)DUPZ128rmk(z?)$",
2014 "^VMOVDQ(A|U)(32|64)Z128rmk(z?)$",
2015 "^VMOVS(D|S)Zrmk(z?)$",
2016 "^VPBROADCAST(D|Q)Z128rmk(z?)$")>;
2017 def : InstRW<[SPRWriteResGroup178, ReadAfterVecXLd], (instregex "^(V?)P(ADD|SUB)(B|D|Q|W)rm$",
2018 "^VP(ADD|SUB)(B|D|Q|W)Z128rm$",
2019 "^VP(ADD|SUB)(D|Q)Z128rm(b|k|kz)$",
2020 "^VP(ADD|SUB)(D|Q)Z128rmbk(z?)$",
2021 "^VPTERNLOG(D|Q)Z128rm(bi|ik)$",
2022 "^VPTERNLOG(D|Q)Z128rmbik(z?)$",
2023 "^VPTERNLOG(D|Q)Z128rmi((kz)?)$")>;
2024 def : InstRW<[SPRWriteResGroup178, ReadAfterVecXLd], (instrs VPBLENDDrmi)>;
2026 def SPRWriteResGroup179 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
2028 let NumMicroOps = 2;
2030 def : InstRW<[SPRWriteResGroup179], (instregex "^VPBROADCAST(B|W)((Z128)?)rm$")>;
2031 def : InstRW<[SPRWriteResGroup179, ReadAfterVecXLd], (instregex "^(V?)PALIGNRrmi$",
2032 "^VALIGN(D|Q)Z128rm(bi|ik)$",
2033 "^VALIGN(D|Q)Z128rmbik(z?)$",
2034 "^VALIGN(D|Q)Z128rmi((kz)?)$")>;
2035 def : InstRW<[SPRWriteResGroup179, ReadAfterVecXLd], (instrs VPALIGNRZ128rmi)>;
2037 def SPRWriteResGroup180 : SchedWriteRes<[SPRPort00_06, SPRPort05]> {
2039 let NumMicroOps = 2;
2041 def : InstRW<[SPRWriteResGroup180], (instrs PAUSE)>;
2043 def SPRWriteResGroup181 : SchedWriteRes<[SPRPort01, SPRPort02_03_11]> {
2045 let NumMicroOps = 2;
2047 def : InstRW<[SPRWriteResGroup181, ReadAfterLd], (instregex "^P(DEP|EXT)(32|64)rm$")>;
2049 def SPRWriteResGroup182 : SchedWriteRes<[SPRPort01_05, SPRPort04_09, SPRPort07_08]> {
2051 let NumMicroOps = 3;
2053 def : InstRW<[SPRWriteResGroup182], (instregex "^(V?)PEXTR(D|Q)mr$",
2055 "^VPMOVQDZ128mr(k?)$")>;
2057 def SPRWriteResGroup183 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11]> {
2058 let ReleaseAtCycles = [1, 2, 1];
2060 let NumMicroOps = 4;
2062 def : InstRW<[SPRWriteResGroup183, ReadAfterVecXLd], (instregex "^(V?)PH(ADD|SUB)SWrm$")>;
2064 def SPRWriteResGroup184 : SchedWriteRes<[SPRPort00_01, SPRPort01_05]> {
2065 let ReleaseAtCycles = [1, 2];
2067 let NumMicroOps = 3;
2069 def : InstRW<[SPRWriteResGroup184], (instregex "^(V?)PH(ADD|SUB)SWrr$",
2070 "^VPH(ADD|SUB)SWYrr$")>;
2072 def SPRWriteResGroup185 : SchedWriteRes<[SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
2074 let NumMicroOps = 3;
2076 def : InstRW<[SPRWriteResGroup185], (instregex "^POP(16|32|64)rmm$",
2077 "^PUSH(16|32)rmm$")>;
2079 def SPRWriteResGroup186 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort02_03_11]> {
2080 let ReleaseAtCycles = [6, 2, 1, 1];
2082 let NumMicroOps = 10;
2084 def : InstRW<[SPRWriteResGroup186], (instrs POPF16)>;
2086 def SPRWriteResGroup187 : SchedWriteRes<[SPRPort00_06, SPRPort01, SPRPort02_03_11]> {
2087 let ReleaseAtCycles = [2, 1, 1];
2089 let NumMicroOps = 7;
2091 def : InstRW<[SPRWriteResGroup187], (instrs POPF64)>;
2093 def SPRWriteResGroup188 : SchedWriteRes<[SPRPort02_03_11]> {
2096 def : InstRW<[SPRWriteResGroup188], (instregex "^PREFETCHT(0|1|2)$")>;
2097 def : InstRW<[SPRWriteResGroup188], (instrs PREFETCHNTA)>;
2099 def SPRWriteResGroup189 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11, SPRPort06]> {
2100 let ReleaseAtCycles = [1, 1, 2];
2101 let Latency = SapphireRapidsModel.MaxLatency;
2102 let NumMicroOps = 4;
2104 def : InstRW<[SPRWriteResGroup189], (instregex "^PTWRITE((64)?)m$")>;
2106 def SPRWriteResGroup190 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort06]> {
2107 let ReleaseAtCycles = [1, 2];
2108 let Latency = SapphireRapidsModel.MaxLatency;
2109 let NumMicroOps = 3;
2111 def : InstRW<[SPRWriteResGroup190], (instrs PTWRITE64r)>;
2113 def SPRWriteResGroup191 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort06]> {
2114 let ReleaseAtCycles = [2, 2];
2115 let Latency = SapphireRapidsModel.MaxLatency;
2116 let NumMicroOps = 4;
2118 def : InstRW<[SPRWriteResGroup191], (instrs PTWRITEr)>;
2120 def SPRWriteResGroup192 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
2121 let NumMicroOps = 2;
2123 def : InstRW<[SPRWriteResGroup192], (instregex "^PUSH64r((mr)?)$")>;
2125 def SPRWriteResGroup193 : SchedWriteRes<[SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
2126 let NumMicroOps = 3;
2128 def : InstRW<[SPRWriteResGroup193], (instrs PUSH64rmm)>;
2130 def SPRWriteResGroup194 : SchedWriteRes<[SPRPort00_06, SPRPort01, SPRPort04_09, SPRPort07_08]> {
2132 let NumMicroOps = 4;
2134 def : InstRW<[SPRWriteResGroup194], (instrs PUSHF64)>;
2136 def SPRWriteResGroup195 : SchedWriteRes<[SPRPort01, SPRPort04_09, SPRPort07_08]> {
2137 let NumMicroOps = 3;
2139 def : InstRW<[SPRWriteResGroup195], (instregex "^PUSH(F|G)S64$")>;
2141 def SPRWriteResGroup196 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2142 let ReleaseAtCycles = [2, 3, 2];
2144 let NumMicroOps = 7;
2146 def : InstRW<[SPRWriteResGroup196], (instregex "^RC(L|R)(16|32|64)rCL$")>;
2148 def SPRWriteResGroup197 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
2149 let ReleaseAtCycles = [1, 2];
2151 let NumMicroOps = 3;
2153 def : InstRW<[SPRWriteResGroup197, WriteRMW], (instregex "^RC(L|R)8m(1|i)$")>;
2155 def SPRWriteResGroup198 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2156 let ReleaseAtCycles = [1, 5, 2];
2158 let NumMicroOps = 8;
2160 def : InstRW<[SPRWriteResGroup198, WriteRMW], (instrs RCL8mCL)>;
2162 def SPRWriteResGroup199 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2163 let ReleaseAtCycles = [2, 5, 2];
2165 let NumMicroOps = 9;
2167 def : InstRW<[SPRWriteResGroup199], (instrs RCL8rCL)>;
2169 def SPRWriteResGroup200 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2170 let ReleaseAtCycles = [2, 4, 3];
2172 let NumMicroOps = 9;
2174 def : InstRW<[SPRWriteResGroup200, WriteRMW], (instrs RCR8mCL)>;
2176 def SPRWriteResGroup201 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2177 let ReleaseAtCycles = [3, 4, 3];
2179 let NumMicroOps = 10;
2181 def : InstRW<[SPRWriteResGroup201], (instrs RCR8rCL)>;
2183 def SPRWriteResGroup202 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_05, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort01_05_10, SPRPort05]> {
2184 let ReleaseAtCycles = [1, 6, 1, 10, 20, 8, 5, 1, 2];
2185 let Latency = SapphireRapidsModel.MaxLatency;
2186 let NumMicroOps = 54;
2188 def : InstRW<[SPRWriteResGroup202], (instrs RDMSR)>;
2190 def SPRWriteResGroup203 : SchedWriteRes<[SPRPort01]> {
2191 let Latency = SapphireRapidsModel.MaxLatency;
2193 def : InstRW<[SPRWriteResGroup203], (instrs RDPID64)>;
2195 def SPRWriteResGroup204 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2196 let Latency = SapphireRapidsModel.MaxLatency;
2197 let NumMicroOps = 3;
2199 def : InstRW<[SPRWriteResGroup204], (instrs RDPKRUr)>;
2201 def SPRWriteResGroup205 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort05]> {
2202 let ReleaseAtCycles = [9, 6, 2, 1];
2203 let Latency = SapphireRapidsModel.MaxLatency;
2204 let NumMicroOps = 18;
2206 def : InstRW<[SPRWriteResGroup205], (instrs RDPMC)>;
2208 def SPRWriteResGroup206 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2209 let ReleaseAtCycles = [2, 3, 2, 5, 7, 3, 1, 2];
2211 let NumMicroOps = 25;
2213 def : InstRW<[SPRWriteResGroup206], (instrs RDRAND16r)>;
2215 def SPRWriteResGroup207 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2216 let ReleaseAtCycles = [2, 3, 2, 5, 7, 3, 1, 2];
2217 let Latency = SapphireRapidsModel.MaxLatency;
2218 let NumMicroOps = 25;
2220 def : InstRW<[SPRWriteResGroup207], (instregex "^RDRAND(32|64)r$")>;
2222 def SPRWriteResGroup208 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
2223 let ReleaseAtCycles = [2, 3, 3, 5, 7, 1, 4];
2225 let NumMicroOps = 25;
2227 def : InstRW<[SPRWriteResGroup208], (instrs RDSEED16r)>;
2229 def SPRWriteResGroup209 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort05]> {
2230 let ReleaseAtCycles = [2, 3, 3, 5, 7, 1, 4];
2231 let Latency = SapphireRapidsModel.MaxLatency;
2232 let NumMicroOps = 25;
2234 def : InstRW<[SPRWriteResGroup209], (instregex "^RDSEED(32|64)r$")>;
2236 def SPRWriteResGroup210 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort05]> {
2237 let ReleaseAtCycles = [5, 6, 3, 1];
2239 let NumMicroOps = 15;
2241 def : InstRW<[SPRWriteResGroup210], (instrs RDTSC)>;
2243 def SPRWriteResGroup211 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort05]> {
2244 let ReleaseAtCycles = [2, 2, 1, 2, 7, 4, 3];
2246 let NumMicroOps = 21;
2248 def : InstRW<[SPRWriteResGroup211], (instrs RDTSCP)>;
2250 def SPRWriteResGroup212 : SchedWriteRes<[SPRPort00_06, SPRPort02_03_11]> {
2252 let NumMicroOps = 2;
2254 def : InstRW<[SPRWriteResGroup212], (instrs RET64)>;
2256 def SPRWriteResGroup213 : SchedWriteRes<[SPRPort00_06, SPRPort02_03_11]> {
2257 let ReleaseAtCycles = [2, 1];
2259 let NumMicroOps = 3;
2261 def : InstRW<[SPRWriteResGroup213], (instregex "^RETI(16|32|64)$")>;
2263 def SPRWriteResGroup214 : SchedWriteRes<[]>;
2264 def : InstRW<[SPRWriteResGroup214], (instrs REX64_PREFIX)>;
2266 def SPRWriteResGroup215 : SchedWriteRes<[SPRPort00_06]> {
2267 let ReleaseAtCycles = [2];
2269 let NumMicroOps = 2;
2271 def : InstRW<[SPRWriteResGroup215, WriteRMW], (instregex "^RO(L|R)(16|32|64)m(1|i|CL)$")>;
2273 def SPRWriteResGroup216 : SchedWriteRes<[SPRPort00_06]> {
2274 let ReleaseAtCycles = [2];
2275 let NumMicroOps = 2;
2277 def : InstRW<[SPRWriteResGroup216], (instregex "^RO(L|R)(8|16|32|64)r(1|i)$")>;
2279 def SPRWriteResGroup217 : SchedWriteRes<[SPRPort00_06]> {
2280 let ReleaseAtCycles = [2];
2282 let NumMicroOps = 2;
2284 def : InstRW<[SPRWriteResGroup217, WriteRMW], (instregex "^RO(L|R)8m(1|i)$",
2286 "^(RO|SA|SH)R8mCL$")>;
2288 def SPRWriteResGroup218 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
2289 let ReleaseAtCycles = [2, 1];
2291 let NumMicroOps = 3;
2293 def : InstRW<[SPRWriteResGroup218], (instregex "^(V?)ROUNDP(D|S)m$")>;
2294 def : InstRW<[SPRWriteResGroup218, ReadAfterVecXLd], (instregex "^(V?)ROUNDS(D|S)m((_Int)?)$",
2295 "^VRNDSCALEP(D|S)Z128rm(bi|ik)$",
2296 "^VRNDSCALEP(D|S)Z128rmbik(z?)$",
2297 "^VRNDSCALEP(D|S)Z128rmi((kz)?)$",
2298 "^VRNDSCALES(D|S)Zm$",
2299 "^VRNDSCALES(D|S)Zm_Int((k|kz)?)$")>;
2301 def SPRWriteResGroup219 : SchedWriteRes<[SPRPort00_01]> {
2302 let ReleaseAtCycles = [2];
2304 let NumMicroOps = 2;
2306 def : InstRW<[SPRWriteResGroup219], (instregex "^(V?)ROUND(PD|SS)r$",
2307 "^(V?)ROUND(PS|SD)r$",
2308 "^(V?)ROUNDS(D|S)r_Int$",
2309 "^VRNDSCALEP(D|S)Z(128|256)rri((k|kz)?)$",
2310 "^VRNDSCALES(D|S)Zr$",
2311 "^VRNDSCALES(D|S)Zr(b?)_Int((k|kz)?)$",
2312 "^VROUNDP(D|S)Yr$")>;
2314 def SPRWriteResGroup220 : SchedWriteRes<[SPRPort00_06]> {
2315 let ReleaseAtCycles = [2];
2317 let NumMicroOps = 2;
2319 def : InstRW<[SPRWriteResGroup220], (instrs SAHF)>;
2321 def SPRWriteResGroup221 : SchedWriteRes<[SPRPort00_06]> {
2324 def : InstRW<[SPRWriteResGroup221, WriteRMW], (instregex "^S(A|H)R8m(1|i)$",
2327 def SPRWriteResGroup222 : SchedWriteRes<[SPRPort00_06, SPRPort02_03_11]> {
2329 let NumMicroOps = 2;
2331 def : InstRW<[SPRWriteResGroup222, ReadAfterLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^S(A|H)RX(32|64)rm$",
2332 "^SHLX(32|64)rm$")>;
2334 def SPRWriteResGroup223 : SchedWriteRes<[SPRPort00_06]> {
2337 def : InstRW<[SPRWriteResGroup223], (instregex "^S(A|H)RX(32|64)rr$",
2338 "^SHLX(32|64)rr$")>;
2340 def SPRWriteResGroup224 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort04_09, SPRPort07_08]> {
2341 let ReleaseAtCycles = [2, 2, 1, 1, 1];
2342 let Latency = SapphireRapidsModel.MaxLatency;
2343 let NumMicroOps = 7;
2345 def : InstRW<[SPRWriteResGroup224], (instrs SERIALIZE)>;
2347 def SPRWriteResGroup225 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
2349 let NumMicroOps = 2;
2351 def : InstRW<[SPRWriteResGroup225], (instrs SFENCE)>;
2353 def SPRWriteResGroup226 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort01, SPRPort04_09, SPRPort07_08]> {
2354 let ReleaseAtCycles = [1, 2, 2, 2];
2356 let NumMicroOps = 7;
2358 def : InstRW<[SPRWriteResGroup226], (instregex "^S(G|I)DT64m$")>;
2360 def SPRWriteResGroup227 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
2362 let NumMicroOps = 3;
2364 def : InstRW<[SPRWriteResGroup227, ReadAfterVecXLd], (instrs SHA1MSG1rm)>;
2366 def SPRWriteResGroup228 : SchedWriteRes<[SPRPort00_01_05, SPRPort05]> {
2368 let NumMicroOps = 2;
2370 def : InstRW<[SPRWriteResGroup228], (instrs SHA1MSG1rr)>;
2372 def SPRWriteResGroup229 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort01_05, SPRPort02_03_11]> {
2373 let ReleaseAtCycles = [2, 2, 1, 2, 1];
2375 let NumMicroOps = 8;
2377 def : InstRW<[SPRWriteResGroup229, ReadAfterVecXLd], (instrs SHA1MSG2rm)>;
2379 def SPRWriteResGroup230 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort01_05]> {
2380 let ReleaseAtCycles = [2, 2, 1, 2];
2382 let NumMicroOps = 7;
2384 def : InstRW<[SPRWriteResGroup230], (instrs SHA1MSG2rr)>;
2386 def SPRWriteResGroup231 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11]> {
2388 let NumMicroOps = 4;
2390 def : InstRW<[SPRWriteResGroup231, ReadAfterVecXLd], (instrs SHA1NEXTErm)>;
2392 def SPRWriteResGroup232 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05]> {
2394 let NumMicroOps = 3;
2396 def : InstRW<[SPRWriteResGroup232], (instrs SHA1NEXTErr)>;
2398 def SPRWriteResGroup233 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
2400 let NumMicroOps = 2;
2402 def : InstRW<[SPRWriteResGroup233], (instregex "^VPMOV(S|Z)XBWZ((256)?)rmk(z?)$",
2403 "^VPOPCNT(B|W)Z(128|256)rmk(z?)$",
2404 "^VPOPCNT(B|W)Zrmk(z?)$")>;
2405 def : InstRW<[SPRWriteResGroup233, ReadAfterVecXLd], (instregex "^VDBPSADBWZ128rmik(z?)$",
2406 "^VPACK(S|U)SDWZ128rm(bk|kz)$",
2407 "^VPACK(S|U)SDWZ128rmbkz$",
2408 "^VPACK(S|U)S(DW|WB)Z128rmk$",
2409 "^VPACK(S|U)SWBZ128rmkz$",
2410 "^VPMULTISHIFTQBZ128rm(bk|kz)$",
2411 "^VPMULTISHIFTQBZ128rm(k|bkz)$")>;
2412 def : InstRW<[SPRWriteResGroup233, ReadAfterVecXLd], (instrs SHA1RNDS4rmi,
2414 def : InstRW<[SPRWriteResGroup233, ReadAfterVecYLd], (instregex "^VDBPSADBWZ((256)?)rmik(z?)$",
2415 "^VPACK(S|U)SDWZ((256)?)rm(bk|kz)$",
2416 "^VPACK(S|U)SDWZ((256)?)rmbkz$",
2417 "^VPACK(S|U)S(DW|WB)Z((256)?)rmk$",
2418 "^VPACK(S|U)SWBZ((256)?)rmkz$",
2419 "^VPERMBZ(128|256)rmk(z?)$",
2421 "^VPMULTISHIFTQBZ((256)?)rm(bk|kz)$",
2422 "^VPMULTISHIFTQBZ((256)?)rm(k|bkz)$")>;
2424 def SPRWriteResGroup234 : SchedWriteRes<[SPRPort05]> {
2427 def : InstRW<[SPRWriteResGroup234], (instrs SHA1RNDS4rri,
2430 def SPRWriteResGroup235 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
2431 let ReleaseAtCycles = [3, 2, 1, 1, 1];
2433 let NumMicroOps = 8;
2435 def : InstRW<[SPRWriteResGroup235, ReadAfterVecXLd], (instrs SHA256MSG1rm)>;
2437 def SPRWriteResGroup236 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort05]> {
2438 let ReleaseAtCycles = [3, 2, 1, 1];
2440 let NumMicroOps = 7;
2442 def : InstRW<[SPRWriteResGroup236], (instrs SHA256MSG1rr)>;
2444 def SPRWriteResGroup237 : SchedWriteRes<[SPRPort05]> {
2445 let ReleaseAtCycles = [2];
2447 let NumMicroOps = 2;
2449 def : InstRW<[SPRWriteResGroup237], (instregex "^VPMOV(D|Q|W|SQ|SW)BZrrk(z?)$",
2450 "^VPMOV((S|US)?)(D|Q)WZrrk(z?)$",
2451 "^VPMOV(U?)SDBZrrk(z?)$",
2452 "^VPMOVUS(Q|W)BZrrk(z?)$")>;
2453 def : InstRW<[SPRWriteResGroup237], (instrs SHA256MSG2rr)>;
2455 def SPRWriteResGroup238 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort07_08]> {
2457 let NumMicroOps = 5;
2459 def : InstRW<[SPRWriteResGroup238], (instrs SHRD16mri8)>;
2461 def SPRWriteResGroup239 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort01]> {
2463 let NumMicroOps = 2;
2465 def : InstRW<[SPRWriteResGroup239], (instregex "^SLDT(32|64)r$")>;
2467 def SPRWriteResGroup240 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort05]> {
2468 let NumMicroOps = 2;
2470 def : InstRW<[SPRWriteResGroup240], (instrs SMSW16r)>;
2472 def SPRWriteResGroup241 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort05]> {
2473 let Latency = SapphireRapidsModel.MaxLatency;
2474 let NumMicroOps = 2;
2476 def : InstRW<[SPRWriteResGroup241], (instregex "^SMSW(32|64)r$")>;
2478 def SPRWriteResGroup242 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
2480 let NumMicroOps = 2;
2482 def : InstRW<[SPRWriteResGroup242, ReadAfterVecLd], (instregex "^(V?)SQRTSDm_Int$")>;
2483 def : InstRW<[SPRWriteResGroup242, ReadAfterVecLd], (instrs VSQRTSDZm_Int)>;
2485 def SPRWriteResGroup243 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
2487 let NumMicroOps = 2;
2489 def : InstRW<[SPRWriteResGroup243], (instrs STD)>;
2491 def SPRWriteResGroup244 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01]> {
2492 let ReleaseAtCycles = [1, 4, 1];
2493 let Latency = SapphireRapidsModel.MaxLatency;
2494 let NumMicroOps = 6;
2496 def : InstRW<[SPRWriteResGroup244], (instrs STI)>;
2498 def SPRWriteResGroup245 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
2499 let ReleaseAtCycles = [2, 1, 1];
2501 let NumMicroOps = 4;
2503 def : InstRW<[SPRWriteResGroup245], (instrs STOSB)>;
2505 def SPRWriteResGroup246 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
2506 let ReleaseAtCycles = [2, 1, 1];
2508 let NumMicroOps = 4;
2510 def : InstRW<[SPRWriteResGroup246], (instregex "^STOS(L|Q|W)$")>;
2512 def SPRWriteResGroup247 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort01]> {
2514 let NumMicroOps = 2;
2516 def : InstRW<[SPRWriteResGroup247], (instregex "^STR(32|64)r$")>;
2518 def SPRWriteResGroup248 : SchedWriteRes<[SPRPort00]> {
2521 def : InstRW<[SPRWriteResGroup248], (instregex "^(TST|XAM)_F$")>;
2522 def : InstRW<[SPRWriteResGroup248], (instrs UCOM_FPPr)>;
2524 def SPRWriteResGroup249 : SchedWriteRes<[SPRPort01_05]> {
2527 def : InstRW<[SPRWriteResGroup249], (instregex "^V(ADD|SUB)P(D|S)Z(128|256)rrkz$",
2528 "^V(ADD|SUB)S(D|S)Zrr(b?)_Intkz$")>;
2530 def SPRWriteResGroup250 : SchedWriteRes<[SPRPort00_05]> {
2533 def : InstRW<[SPRWriteResGroup250], (instregex "^V(ADD|SUB)P(D|S)Zrr(b?)$",
2534 "^VMOVDQU(8|16)Zrrk(z?)((_REV)?)$",
2535 "^VP(ADD|SUB)(B|W)Zrrk(z?)$",
2536 "^VPBLENDM(B|W)Zrrk(z?)$",
2537 "^VPMOVM2(B|W)Zrr$")>;
2539 def SPRWriteResGroup251 : SchedWriteRes<[SPRPort00_01]> {
2542 def : InstRW<[SPRWriteResGroup251], (instregex "^V(ADD|SUB)PHZ(128|256)rrk(z?)$",
2543 "^V(ADD|SUB)SHZrr(b?)_Intk(z?)$",
2544 "^VCVT(T?)PH2(U?)WZ(128|256)rrk(z?)$",
2545 "^VCVT(U?)W2PHZ(128|256)rrk(z?)$",
2546 "^VF(N?)M(ADD|SUB)(132|213|231)PHZ(128|256)rk(z?)$",
2547 "^VF(N?)M(ADD|SUB)(132|213|231)SHZr(b?)_Intk(z?)$",
2548 "^VFMADDSUB(132|213|231)PHZ(128|256)rk(z?)$",
2549 "^VFMSUBADD(132|213|231)PHZ(128|256)rk(z?)$",
2550 "^VGETEXPPHZ(128|256)rk(z?)$",
2551 "^VGETEXPSHZr(bk|kz)$",
2552 "^VGETEXPSHZr(k|bkz)$",
2553 "^VGETMANTPHZ(128|256)rrik(z?)$",
2554 "^VGETMANTSHZrri(bk|kz)$",
2555 "^VGETMANTSHZrri(k|bkz)$",
2556 "^VM(AX|IN)CPHZ(128|256)rrk(z?)$",
2557 "^VM(AX|IN|UL)PHZ(128|256)rrk(z?)$",
2558 "^VM(AX|IN|UL)SHZrr(b?)_Intk(z?)$")>;
2560 def SPRWriteResGroup252 : SchedWriteRes<[SPRPort00]> {
2563 def : InstRW<[SPRWriteResGroup252], (instregex "^V(ADD|SUB)PHZrr(b?)$",
2564 "^VAES(DE|EN)C((LAST)?)Zrr$",
2565 "^VCVT(T?)PH2(U?)WZrr(b?)$",
2566 "^VCVT(U?)W2PHZrr(b?)$",
2567 "^VF(N?)M(ADD|SUB)(132|213|231)PHZr(b?)$",
2568 "^VFMADDSUB(132|213|231)PHZr(b?)$",
2569 "^VFMSUBADD(132|213|231)PHZr(b?)$",
2570 "^VGETEXPPHZr(b?)$",
2571 "^VGETMANTPHZrri(b?)$",
2572 "^VM(AX|IN)CPHZrr$",
2573 "^VM(AX|IN|UL)PHZrr(b?)$",
2574 "^VMOVMSKP(D|S)Yrr$")>;
2575 def : InstRW<[SPRWriteResGroup252], (instrs VGF2P8MULBZrr)>;
2577 def SPRWriteResGroup253 : SchedWriteRes<[SPRPort00]> {
2580 def : InstRW<[SPRWriteResGroup253], (instregex "^V(ADD|SUB)PHZrr(bk|kz)$",
2581 "^V(ADD|SUB)PHZrr(k|bkz)$",
2582 "^VCVT(T?)PH2(U?)WZrr(bk|kz)$",
2583 "^VCVT(T?)PH2(U?)WZrr(k|bkz)$",
2584 "^VCVT(U?)W2PHZrr(bk|kz)$",
2585 "^VCVT(U?)W2PHZrr(k|bkz)$",
2586 "^VF(N?)M(ADD|SUB)(132|213|231)PHZr(bk|kz)$",
2587 "^VF(N?)M(ADD|SUB)(132|213|231)PHZr(k|bkz)$",
2588 "^VFMADDSUB(132|213|231)PHZr(bk|kz)$",
2589 "^VFMADDSUB(132|213|231)PHZr(k|bkz)$",
2590 "^VFMSUBADD(132|213|231)PHZr(bk|kz)$",
2591 "^VFMSUBADD(132|213|231)PHZr(k|bkz)$",
2592 "^VGETEXPPHZr(bk|kz)$",
2593 "^VGETEXPPHZr(k|bkz)$",
2594 "^VGETMANTPHZrri(bk|kz)$",
2595 "^VGETMANTPHZrri(k|bkz)$",
2596 "^VM(AX|IN)CPHZrrk(z?)$",
2597 "^VM(AX|IN|UL)PHZrr(bk|kz)$",
2598 "^VM(AX|IN|UL)PHZrr(k|bkz)$")>;
2600 def SPRWriteResGroup254 : SchedWriteRes<[SPRPort01_05, SPRPort02_03_11]> {
2602 let NumMicroOps = 2;
2604 def : InstRW<[SPRWriteResGroup254], (instregex "^VPMOV(S|Z)XBWZ128rmk(z?)$",
2605 "^VPSHUF(H|L)WZ(128|256)mik(z?)$")>;
2606 def : InstRW<[SPRWriteResGroup254, ReadAfterVecYLd], (instregex "^V(ADD|SUB)PSYrm$",
2607 "^V(ADD|SUB)PSZ256rm((b|k|bk|kz)?)$",
2608 "^V(ADD|SUB)PSZ256rmbkz$",
2609 "^VPSHUFBZ256rmk(z?)$",
2610 "^VPUNPCK(H|L)(BW|WD)Z256rmk(z?)$")>;
2611 def : InstRW<[SPRWriteResGroup254, ReadAfterVecYLd], (instrs VADDSUBPSYrm)>;
2612 def : InstRW<[SPRWriteResGroup254, ReadAfterVecXLd], (instregex "^VPSHUFBZ128rmk(z?)$",
2613 "^VPUNPCK(H|L)(BW|WD)Z128rmk(z?)$")>;
2615 def SPRWriteResGroup255 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11]> {
2617 let NumMicroOps = 2;
2619 def : InstRW<[SPRWriteResGroup255], (instregex "^VMOVDQU(8|16)Zrmk(z?)$")>;
2620 def : InstRW<[SPRWriteResGroup255, ReadAfterVecYLd], (instregex "^V(ADD|SUB)PSZrm((b|k|bk|kz)?)$",
2621 "^V(ADD|SUB)PSZrmbkz$",
2622 "^VP(ADD|SUB)(B|W)Zrmk(z?)$",
2623 "^VPBLENDM(B|W)Zrmk(z?)$")>;
2625 def SPRWriteResGroup256 : SchedWriteRes<[SPRPort00_05]> {
2628 def : InstRW<[SPRWriteResGroup256], (instregex "^V(ADD|SUB)PSZrr(bk|kz)$",
2629 "^V(ADD|SUB)PSZrr(k|bkz)$")>;
2631 def SPRWriteResGroup257 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
2633 let NumMicroOps = 2;
2635 def : InstRW<[SPRWriteResGroup257], (instregex "^VCVT(T?)PS2(U?)DQZrm((b|k|bk|kz)?)$",
2636 "^VCVT(T?)PS2(U?)DQZrmbkz$",
2637 "^VPLZCNT(D|Q)Zrm((b|k|bk|kz)?)$",
2638 "^VPLZCNT(D|Q)Zrmbkz$")>;
2639 def : InstRW<[SPRWriteResGroup257, ReadAfterVecXLd], (instregex "^VAES(DE|EN)C((LAST)?)Zrm$")>;
2640 def : InstRW<[SPRWriteResGroup257, ReadAfterVecYLd], (instregex "^VGF2P8AFFINE((INV)?)QBZrm(b?)i$")>;
2641 def : InstRW<[SPRWriteResGroup257, ReadAfterVecYLd], (instrs VGF2P8MULBZrm)>;
2642 def : InstRW<[SPRWriteResGroup257, ReadAfterVecYLd, ReadAfterVecYLd], (instregex "^VPMADD52(H|L)UQZm((b|k|bk|kz)?)$",
2643 "^VPMADD52(H|L)UQZmbkz$")>;
2645 def SPRWriteResGroup258 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
2647 let NumMicroOps = 2;
2649 def : InstRW<[SPRWriteResGroup258], (instregex "^VPBROADCAST(B|W)Z128rmk(z?)$",
2650 "^VPOPCNT(B|D|Q|W)Z((256)?)rm$",
2651 "^VPOPCNT(D|Q)Z((256)?)rm(b|k|kz)$",
2652 "^VPOPCNT(D|Q)Z((256)?)rmbk(z?)$",
2653 "^VPSHUF(H|L)WZmik(z?)$")>;
2654 def : InstRW<[SPRWriteResGroup258, ReadAfterVecYLd], (instregex "^VALIGN(D|Q)Z((256)?)rm(bi|ik)$",
2655 "^VALIGN(D|Q)Z((256)?)rmbik(z?)$",
2656 "^VALIGN(D|Q)Z((256)?)rmi((kz)?)$",
2657 "^VFPCLASSP(D|H|S)Z((256)?)rmb$",
2658 "^VPACK(S|U)S(DW|WB)(Y|Z)rm$",
2659 "^VPACK(S|U)S(DW|WB)Z256rm$",
2660 "^VPACK(S|U)SDWZ((256)?)rmb$",
2661 "^VPALIGNRZ((256)?)rmik(z?)$",
2662 "^VPM(AX|IN)(S|U)QZ((256)?)rm((b|k|bk|kz)?)$",
2663 "^VPM(AX|IN)(S|U)QZ((256)?)rmbkz$",
2664 "^VPMULTISHIFTQBZ((256)?)rm(b?)$",
2665 "^VPUNPCK(H|L)(BW|WD)Zrmk(z?)$")>;
2666 def : InstRW<[SPRWriteResGroup258, ReadAfterVecYLd], (instrs VPCMPGTQYrm)>;
2667 def : InstRW<[SPRWriteResGroup258, ReadAfterVecXLd], (instregex "^VPALIGNRZ128rmik(z?)$",
2668 "^VPCLMULQDQ(Y|Z)rm$")>;
2669 def : InstRW<[SPRWriteResGroup258, ReadAfterVecXLd], (instrs VPCLMULQDQZ256rm)>;
2671 def SPRWriteResGroup259 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11]> {
2672 let ReleaseAtCycles = [3, 1];
2674 let NumMicroOps = 4;
2676 def : InstRW<[SPRWriteResGroup259, ReadAfterVecYLd, ReadAfterVecYLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^VBLENDVP(D|S)Yrm$")>;
2677 def : InstRW<[SPRWriteResGroup259, ReadAfterVecYLd, ReadAfterVecYLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instrs VPBLENDVBYrm)>;
2679 def SPRWriteResGroup260 : SchedWriteRes<[SPRPort00_01_05]> {
2680 let ReleaseAtCycles = [3];
2682 let NumMicroOps = 3;
2684 def : InstRW<[SPRWriteResGroup260], (instregex "^VBLENDVP(S|DY)rr$",
2685 "^VBLENDVP(D|SY)rr$",
2686 "^VPBLENDVB(Y?)rr$")>;
2688 def SPRWriteResGroup261 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11]> {
2689 let ReleaseAtCycles = [3, 1];
2691 let NumMicroOps = 4;
2693 def : InstRW<[SPRWriteResGroup261, ReadAfterVecXLd, ReadAfterVecXLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instregex "^VBLENDVP(D|S)rm$")>;
2694 def : InstRW<[SPRWriteResGroup261, ReadAfterVecXLd, ReadAfterVecXLd, ReadDefault, ReadDefault, ReadDefault, ReadDefault, ReadDefault], (instrs VPBLENDVBrm)>;
2696 def SPRWriteResGroup262 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11]> {
2698 let NumMicroOps = 2;
2700 def : InstRW<[SPRWriteResGroup262], (instregex "^VBROADCAST(F|I)32X(2|4)Z256rmk(z?)$",
2701 "^VBROADCAST(F|I)64X2Z128rmk(z?)$",
2702 "^VBROADCASTS(D|S)Z256rmk(z?)$",
2703 "^VMOV(A|U)P(D|S)Z256rmk(z?)$",
2704 "^VMOV(D|SH|SL)DUPZ256rmk(z?)$",
2705 "^VMOVDQ(A|U)(32|64)Z256rmk(z?)$",
2706 "^VPBROADCAST(D|Q)Z256rmk(z?)$")>;
2707 def : InstRW<[SPRWriteResGroup262, ReadAfterVecYLd], (instregex "^VINSERT(F|I)128rm$",
2708 "^VINSERT(F|I)(32x4|64x2)Z256rm((k|kz)?)$",
2709 "^VP(ADD|SUB)(B|D|Q|W)(Y|Z256)rm$",
2710 "^VP(ADD|SUB)(D|Q)Z256rm(b|k|kz)$",
2711 "^VP(ADD|SUB)(D|Q)Z256rmbk(z?)$",
2712 "^VPTERNLOG(D|Q)Z256rm(bi|ik)$",
2713 "^VPTERNLOG(D|Q)Z256rmbik(z?)$",
2714 "^VPTERNLOG(D|Q)Z256rmi((kz)?)$")>;
2716 def SPRWriteResGroup263 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
2718 let NumMicroOps = 2;
2720 def : InstRW<[SPRWriteResGroup263, ReadAfterVecXLd], (instregex "^VCMPP(D|H|S)Z128rm(bi|ik)$",
2721 "^VCMPP(D|H|S)Z128rm(i|bik)$",
2722 "^VFPCLASSP(D|H|S)Z128rm(b?)k$",
2723 "^VPCMP(B|D|Q|W|UD|UQ|UW)Z128rmi(k?)$",
2724 "^VPCMP(D|Q|UQ)Z128rmib(k?)$",
2725 "^VPCMP(EQ|GT)(B|D|Q|W)Z128rm(k?)$",
2726 "^VPCMP(EQ|GT)(D|Q)Z128rmb(k?)$",
2727 "^VPCMPUBZ128rmi(k?)$",
2728 "^VPCMPUDZ128rmib(k?)$",
2729 "^VPTEST(N?)M(B|D|Q|W)Z128rm(k?)$",
2730 "^VPTEST(N?)M(D|Q)Z128rmb(k?)$")>;
2731 def : InstRW<[SPRWriteResGroup263, ReadAfterVecYLd], (instregex "^VCMPP(D|H|S)Z((256)?)rm(bi|ik)$",
2732 "^VCMPP(D|H|S)Z((256)?)rm(i|bik)$",
2733 "^VFPCLASSP(D|H|S)Z((256)?)rm(b?)k$",
2734 "^VPCMP(B|D|Q|W|UD|UQ|UW)Z((256)?)rmi(k?)$",
2735 "^VPCMP(D|Q|UQ)Z((256)?)rmib(k?)$",
2736 "^VPCMP(EQ|GT)(B|D|Q|W)Z((256)?)rm(k?)$",
2737 "^VPCMP(EQ|GT)(D|Q)Z((256)?)rmb(k?)$",
2738 "^VPCMPUBZ((256)?)rmi(k?)$",
2739 "^VPCMPUDZ((256)?)rmib(k?)$",
2740 "^VPTEST(N?)M(B|D|Q|W)Z((256)?)rm(k?)$",
2741 "^VPTEST(N?)M(D|Q)Z((256)?)rmb(k?)$")>;
2742 def : InstRW<[SPRWriteResGroup263, ReadAfterVecLd], (instregex "^VCMPS(D|H|S)Zrm$",
2743 "^VCMPS(D|H|S)Zrm_Int(k?)$",
2744 "^VFPCLASSS(D|H|S)Zrmk$")>;
2746 def SPRWriteResGroup264 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
2748 let NumMicroOps = 2;
2750 def : InstRW<[SPRWriteResGroup264, ReadAfterVecLd], (instregex "^V(U?)COMISHZrm((_Int)?)$")>;
2752 def SPRWriteResGroup265 : SchedWriteRes<[SPRPort04_09, SPRPort05, SPRPort07_08]> {
2753 let ReleaseAtCycles = [1, 2, 1];
2755 let NumMicroOps = 4;
2757 def : InstRW<[SPRWriteResGroup265], (instregex "^VCOMPRESSP(D|S)Z(128|256)mr$",
2758 "^VCOMPRESSP(D|S)Zmr$",
2759 "^VPCOMPRESS(D|Q)Z(128|256)mr$",
2760 "^VPCOMPRESS(D|Q)Zmr$",
2761 "^VPMOV(D|Q|W|SQ|SW)BZmr$",
2762 "^VPMOV((S|US)?)(D|Q)WZmr$",
2763 "^VPMOV(U?)S(DB|QD)Zmr$",
2764 "^VPMOVUS(Q|W)BZmr$")>;
2766 def SPRWriteResGroup266 : SchedWriteRes<[SPRPort04_09, SPRPort05, SPRPort07_08]> {
2767 let ReleaseAtCycles = [1, 2, 1];
2769 let NumMicroOps = 4;
2771 def : InstRW<[SPRWriteResGroup266], (instregex "^VCOMPRESSP(D|S)Z(128|256)mrk$",
2772 "^VCOMPRESSP(D|S)Zmrk$",
2773 "^VPCOMPRESS(D|Q)Z(128|256)mrk$",
2774 "^VPCOMPRESS(D|Q)Zmrk$",
2775 "^VPMOV(D|Q|W|SQ|SW)BZmrk$",
2776 "^VPMOV((S|US)?)(D|Q)WZmrk$",
2777 "^VPMOV(U?)S(DB|QD)Zmrk$",
2778 "^VPMOVUS(Q|W)BZmrk$")>;
2780 def SPRWriteResGroup267 : SchedWriteRes<[SPRPort05]> {
2781 let ReleaseAtCycles = [2];
2783 let NumMicroOps = 2;
2785 def : InstRW<[SPRWriteResGroup267], (instregex "^VCOMPRESSP(D|S)Z(128|256)rr$",
2786 "^VCOMPRESSP(D|S)Zrr$",
2787 "^VEXPANDP(D|S)Z(128|256)rr$",
2788 "^VEXPANDP(D|S)Zrr$",
2789 "^VPCOMPRESS(B|D|Q|W)Z(128|256)rr$",
2790 "^VPCOMPRESS(B|D|Q|W)Zrr$",
2791 "^VPEXPAND(B|D|Q|W)Z(128|256)rr$",
2792 "^VPEXPAND(B|D|Q|W)Zrr$")>;
2794 def SPRWriteResGroup268 : SchedWriteRes<[SPRPort00, SPRPort05]> {
2796 let NumMicroOps = 2;
2798 def : InstRW<[SPRWriteResGroup268], (instregex "^VCVT(U?)DQ2PDZrr((k|kz)?)$",
2799 "^VCVT(T?)PS2(U?)QQZrr((b|k|bk|kz)?)$",
2800 "^VCVT(T?)PS2(U?)QQZrrbkz$",
2801 "^VCVT(U?)QQ2PSZrr((b|k|bk|kz)?)$",
2802 "^VCVT(U?)QQ2PSZrrbkz$")>;
2804 def SPRWriteResGroup269 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2806 let NumMicroOps = 4;
2808 def : InstRW<[SPRWriteResGroup269], (instregex "^VCVT(U?)DQ2PHZ128rm(b?)$",
2809 "^VCVTNEPS2BF16Z128rm(b?)$")>;
2811 def SPRWriteResGroup270 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2813 let NumMicroOps = 4;
2815 def : InstRW<[SPRWriteResGroup270], (instregex "^VCVT(U?)DQ2PHZ128rm(bk|kz)$",
2816 "^VCVT(U?)DQ2PHZ128rm(k|bkz)$")>;
2818 def SPRWriteResGroup271 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2820 let NumMicroOps = 3;
2822 def : InstRW<[SPRWriteResGroup271], (instregex "^VCVT(U?)DQ2PHZ128rr$")>;
2824 def SPRWriteResGroup272 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2826 let NumMicroOps = 3;
2828 def : InstRW<[SPRWriteResGroup272], (instregex "^VCVT(U?)DQ2PHZ128rrk(z?)$")>;
2830 def SPRWriteResGroup273 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2832 let NumMicroOps = 4;
2834 def : InstRW<[SPRWriteResGroup273], (instregex "^VCVT(U?)DQ2PHZ256rm(b?)$",
2835 "^VCVTNEPS2BF16Z128rm(bk|kz)$",
2836 "^VCVTNEPS2BF16Z128rm(k|bkz)$")>;
2838 def SPRWriteResGroup274 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2840 let NumMicroOps = 4;
2842 def : InstRW<[SPRWriteResGroup274], (instregex "^VCVT(U?)DQ2PHZ256rm(bk|kz)$",
2843 "^VCVT(U?)DQ2PHZ256rm(k|bkz)$")>;
2845 def SPRWriteResGroup275 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2847 let NumMicroOps = 3;
2849 def : InstRW<[SPRWriteResGroup275], (instregex "^VCVT(U?)DQ2PHZ256rr$")>;
2851 def SPRWriteResGroup276 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2853 let NumMicroOps = 3;
2855 def : InstRW<[SPRWriteResGroup276], (instregex "^VCVT(U?)DQ2PHZ256rrk(z?)$")>;
2857 def SPRWriteResGroup277 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
2858 let ReleaseAtCycles = [1, 1, 2];
2860 let NumMicroOps = 4;
2862 def : InstRW<[SPRWriteResGroup277], (instregex "^VCVT(U?)DQ2PHZrm(b?)$")>;
2864 def SPRWriteResGroup278 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
2865 let ReleaseAtCycles = [1, 1, 2];
2867 let NumMicroOps = 4;
2869 def : InstRW<[SPRWriteResGroup278], (instregex "^VCVT(U?)DQ2PHZrm(bk|kz)$",
2870 "^VCVT(U?)DQ2PHZrm(k|bkz)$")>;
2872 def SPRWriteResGroup279 : SchedWriteRes<[SPRPort00, SPRPort05]> {
2873 let ReleaseAtCycles = [1, 2];
2875 let NumMicroOps = 3;
2877 def : InstRW<[SPRWriteResGroup279], (instregex "^VCVT(U?)DQ2PHZrr(b?)$")>;
2879 def SPRWriteResGroup280 : SchedWriteRes<[SPRPort00, SPRPort05]> {
2880 let ReleaseAtCycles = [1, 2];
2882 let NumMicroOps = 3;
2884 def : InstRW<[SPRWriteResGroup280], (instregex "^VCVT(U?)DQ2PHZrr(bk|kz)$",
2885 "^VCVT(U?)DQ2PHZrr(k|bkz)$")>;
2887 def SPRWriteResGroup281 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2888 let ReleaseAtCycles = [2, 1, 1, 1];
2890 let NumMicroOps = 5;
2892 def : InstRW<[SPRWriteResGroup281, ReadAfterVecXLd], (instregex "^VCVTNE2PS2BF16Z128rm(b?)$")>;
2894 def SPRWriteResGroup282 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2895 let ReleaseAtCycles = [2, 1, 1, 1];
2897 let NumMicroOps = 5;
2899 def : InstRW<[SPRWriteResGroup282, ReadAfterVecXLd], (instregex "^VCVTNE2PS2BF16Z128rm(bk|kz)$",
2900 "^VCVTNE2PS2BF16Z128rm(k|bkz)$")>;
2902 def SPRWriteResGroup283 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2903 let ReleaseAtCycles = [2, 1, 1];
2905 let NumMicroOps = 4;
2907 def : InstRW<[SPRWriteResGroup283], (instregex "^VCVTNE2PS2BF16Z(128|256)rr$")>;
2909 def SPRWriteResGroup284 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2910 let ReleaseAtCycles = [2, 1, 1];
2912 let NumMicroOps = 4;
2914 def : InstRW<[SPRWriteResGroup284], (instregex "^VCVTNE2PS2BF16Z(128|256)rrk(z?)$")>;
2916 def SPRWriteResGroup285 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2917 let ReleaseAtCycles = [2, 1, 1, 1];
2919 let NumMicroOps = 5;
2921 def : InstRW<[SPRWriteResGroup285, ReadAfterVecYLd], (instregex "^VCVTNE2PS2BF16Z256rm(b?)$")>;
2923 def SPRWriteResGroup286 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2924 let ReleaseAtCycles = [2, 1, 1, 1];
2926 let NumMicroOps = 5;
2928 def : InstRW<[SPRWriteResGroup286, ReadAfterVecYLd], (instregex "^VCVTNE2PS2BF16Z256rm(bk|kz)$",
2929 "^VCVTNE2PS2BF16Z256rm(k|bkz)$")>;
2931 def SPRWriteResGroup287 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
2932 let ReleaseAtCycles = [2, 1, 2];
2934 let NumMicroOps = 5;
2936 def : InstRW<[SPRWriteResGroup287, ReadAfterVecYLd], (instregex "^VCVTNE2PS2BF16Zrm(b?)$",
2937 "^VDPBF16PSZm((b|k|bk|kz)?)$")>;
2938 def : InstRW<[SPRWriteResGroup287, ReadAfterVecYLd], (instrs VDPBF16PSZmbkz)>;
2940 def SPRWriteResGroup288 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
2941 let ReleaseAtCycles = [2, 1, 2];
2943 let NumMicroOps = 5;
2945 def : InstRW<[SPRWriteResGroup288, ReadAfterVecYLd], (instregex "^VCVTNE2PS2BF16Zrm(bk|kz)$",
2946 "^VCVTNE2PS2BF16Zrm(k|bkz)$")>;
2948 def SPRWriteResGroup289 : SchedWriteRes<[SPRPort00, SPRPort05]> {
2949 let ReleaseAtCycles = [2, 2];
2951 let NumMicroOps = 4;
2953 def : InstRW<[SPRWriteResGroup289], (instregex "^VDPBF16PSZr((k|kz)?)$")>;
2954 def : InstRW<[SPRWriteResGroup289], (instrs VCVTNE2PS2BF16Zrr)>;
2956 def SPRWriteResGroup290 : SchedWriteRes<[SPRPort00, SPRPort05]> {
2957 let ReleaseAtCycles = [2, 2];
2959 let NumMicroOps = 4;
2961 def : InstRW<[SPRWriteResGroup290], (instregex "^VCVTNE2PS2BF16Zrrk(z?)$")>;
2963 def SPRWriteResGroup291 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2965 let NumMicroOps = 3;
2967 def : InstRW<[SPRWriteResGroup291], (instregex "^VCVTNEPS2BF16Z(128|256)rr$")>;
2969 def SPRWriteResGroup292 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort05]> {
2971 let NumMicroOps = 3;
2973 def : InstRW<[SPRWriteResGroup292], (instregex "^VCVTNEPS2BF16Z(128|256)rrk(z?)$")>;
2975 def SPRWriteResGroup293 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2977 let NumMicroOps = 4;
2979 def : InstRW<[SPRWriteResGroup293], (instregex "^VCVTNEPS2BF16Z256rm(b?)$")>;
2981 def SPRWriteResGroup294 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
2983 let NumMicroOps = 4;
2985 def : InstRW<[SPRWriteResGroup294], (instregex "^VCVTNEPS2BF16Z256rm(bk|kz)$",
2986 "^VCVTNEPS2BF16Z256rm(k|bkz)$")>;
2988 def SPRWriteResGroup295 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
2989 let ReleaseAtCycles = [1, 1, 2];
2991 let NumMicroOps = 4;
2993 def : InstRW<[SPRWriteResGroup295], (instregex "^VCVTNEPS2BF16Zrm(b?)$")>;
2995 def SPRWriteResGroup296 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
2996 let ReleaseAtCycles = [1, 1, 2];
2998 let NumMicroOps = 4;
3000 def : InstRW<[SPRWriteResGroup296], (instregex "^VCVTNEPS2BF16Zrm(bk|kz)$",
3001 "^VCVTNEPS2BF16Zrm(k|bkz)$")>;
3003 def SPRWriteResGroup297 : SchedWriteRes<[SPRPort00, SPRPort05]> {
3004 let ReleaseAtCycles = [1, 2];
3006 let NumMicroOps = 3;
3008 def : InstRW<[SPRWriteResGroup297], (instrs VCVTNEPS2BF16Zrr)>;
3010 def SPRWriteResGroup298 : SchedWriteRes<[SPRPort00, SPRPort05]> {
3011 let ReleaseAtCycles = [1, 2];
3013 let NumMicroOps = 3;
3015 def : InstRW<[SPRWriteResGroup298], (instregex "^VCVTNEPS2BF16Zrrk(z?)$")>;
3017 def SPRWriteResGroup299 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3019 let NumMicroOps = 3;
3021 def : InstRW<[SPRWriteResGroup299], (instregex "^VCVT(T?)PD2DQYrm$",
3022 "^VCVT(T?)P(D|H)2(U?)DQZ256rm(b?)$",
3023 "^VCVT(T?)PD2(U?)DQZ256rm(bk|kz)$",
3024 "^VCVT(T?)PD2(U?)DQZ256rm(k|bkz)$",
3025 "^VCVTPH2PSXZ128rm(bk|kz)$",
3026 "^VCVTPH2PSXZ128rm(k|bkz)$",
3027 "^VCVTPH2PSXZ256rm(b?)$",
3028 "^VCVT(U?)QQ2PSZ256rm((b|k|bk|kz)?)$",
3029 "^VCVT(U?)QQ2PSZ256rmbkz$")>;
3031 def SPRWriteResGroup300 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
3033 let NumMicroOps = 3;
3035 def : InstRW<[SPRWriteResGroup300], (instregex "^VCVT(T?)P(D|H)2(U?)DQZrm(b?)$",
3036 "^VCVT(T?)PD2(U?)DQZrm(bk|kz)$",
3037 "^VCVT(T?)PD2(U?)DQZrm(k|bkz)$",
3038 "^VCVTPH2PSXZrm(b?)$",
3039 "^VCVT(U?)QQ2PSZrm((b|k|bk|kz)?)$",
3040 "^VCVT(U?)QQ2PSZrmbkz$")>;
3042 def SPRWriteResGroup301 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3043 let ReleaseAtCycles = [2, 1, 1, 1, 2];
3045 let NumMicroOps = 7;
3047 def : InstRW<[SPRWriteResGroup301], (instregex "^VCVTPD2PHZ128rm(b?)$")>;
3049 def SPRWriteResGroup302 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3050 let ReleaseAtCycles = [2, 1, 1, 1, 2];
3052 let NumMicroOps = 7;
3054 def : InstRW<[SPRWriteResGroup302], (instregex "^VCVTPD2PHZ128rm(bk|kz)$",
3055 "^VCVTPD2PHZ128rm(k|bkz)$")>;
3057 def SPRWriteResGroup303 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
3058 let ReleaseAtCycles = [2, 1, 2];
3060 let NumMicroOps = 5;
3062 def : InstRW<[SPRWriteResGroup303], (instrs VCVTPD2PHZ128rr)>;
3064 def SPRWriteResGroup304 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
3065 let ReleaseAtCycles = [2, 1, 2];
3067 let NumMicroOps = 5;
3069 def : InstRW<[SPRWriteResGroup304], (instregex "^VCVTPD2PHZ128rrk(z?)$")>;
3071 def SPRWriteResGroup305 : SchedWriteRes<[SPRPort00_01, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3072 let ReleaseAtCycles = [2, 1, 1, 2];
3074 let NumMicroOps = 6;
3076 def : InstRW<[SPRWriteResGroup305], (instregex "^VCVTPD2PHZ256rm(b?)$")>;
3078 def SPRWriteResGroup306 : SchedWriteRes<[SPRPort00_01, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3079 let ReleaseAtCycles = [2, 1, 1, 2];
3081 let NumMicroOps = 6;
3083 def : InstRW<[SPRWriteResGroup306], (instregex "^VCVTPD2PHZ256rm(bk|kz)$",
3084 "^VCVTPD2PHZ256rm(k|bkz)$")>;
3086 def SPRWriteResGroup307 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3087 let ReleaseAtCycles = [2, 2];
3089 let NumMicroOps = 4;
3091 def : InstRW<[SPRWriteResGroup307], (instrs VCVTPD2PHZ256rr)>;
3093 def SPRWriteResGroup308 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3094 let ReleaseAtCycles = [2, 2];
3096 let NumMicroOps = 4;
3098 def : InstRW<[SPRWriteResGroup308], (instregex "^VCVTPD2PHZ256rrk(z?)$")>;
3100 def SPRWriteResGroup309 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3101 let ReleaseAtCycles = [2, 1, 1, 2];
3103 let NumMicroOps = 6;
3105 def : InstRW<[SPRWriteResGroup309], (instregex "^VCVTP(D2PH|H2PD)Zrm(b?)$")>;
3107 def SPRWriteResGroup310 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3108 let ReleaseAtCycles = [2, 1, 1, 2];
3110 let NumMicroOps = 6;
3112 def : InstRW<[SPRWriteResGroup310], (instregex "^VCVTP(D2PH|H2PD)Zrm(bk|kz)$",
3113 "^VCVTP(D2PH|H2PD)Zrm(k|bkz)$")>;
3115 def SPRWriteResGroup311 : SchedWriteRes<[SPRPort00, SPRPort05]> {
3116 let ReleaseAtCycles = [2, 2];
3118 let NumMicroOps = 4;
3120 def : InstRW<[SPRWriteResGroup311], (instregex "^VCVTP(D2PH|H2PD)Zrr(b?)$")>;
3122 def SPRWriteResGroup312 : SchedWriteRes<[SPRPort00, SPRPort05]> {
3123 let ReleaseAtCycles = [2, 2];
3125 let NumMicroOps = 4;
3127 def : InstRW<[SPRWriteResGroup312], (instregex "^VCVTP(D2PH|H2PD)Zrr(bk|kz)$",
3128 "^VCVTP(D2PH|H2PD)Zrr(k|bkz)$")>;
3130 def SPRWriteResGroup313 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
3132 let NumMicroOps = 2;
3134 def : InstRW<[SPRWriteResGroup313], (instregex "^VCVT(T?)PD2(U?)QQZ128rm((b|k|bk|kz)?)$",
3135 "^VCVT(T?)PD2(U?)QQZ128rmbkz$",
3136 "^VPABS(B|W)Z(128|256)rmk(z?)$",
3137 "^VPLZCNT(D|Q)Z128rm((b|k|bk|kz)?)$",
3138 "^VPLZCNT(D|Q)Z128rmbkz$",
3139 "^VPS(L|R)LWZ(128|256)mik(z?)$",
3140 "^VPSRAWZ(128|256)mik(z?)$")>;
3141 def : InstRW<[SPRWriteResGroup313, ReadAfterVecLd], (instregex "^VFIXUPIMMS(D|S)Zrmi((k|kz)?)$",
3142 "^VSCALEFS(D|S)Zrm((k|kz)?)$")>;
3143 def : InstRW<[SPRWriteResGroup313, ReadAfterVecXLd], (instregex "^VP(ADD|SUB)(U?)S(B|W)Z128rmk(z?)$",
3144 "^VPAVG(B|W)Z128rmk(z?)$",
3145 "^VPM(AX|IN)(SB|UW)Z128rmk(z?)$",
3146 "^VPM(AX|IN)(SW|UB)Z128rmk(z?)$",
3147 "^VPSH(L|R)DVWZ128mk(z?)$",
3148 "^VPS(L|R)L(V?)WZ128rmk(z?)$",
3149 "^VPSRA(V?)WZ128rmk(z?)$")>;
3150 def : InstRW<[SPRWriteResGroup313, ReadAfterVecYLd], (instregex "^VP(ADD|SUB)(U?)S(B|W)Z256rmk(z?)$",
3151 "^VPAVG(B|W)Z256rmk(z?)$",
3152 "^VPM(AX|IN)(SB|UW)Z256rmk(z?)$",
3153 "^VPM(AX|IN)(SW|UB)Z256rmk(z?)$",
3154 "^VPSH(L|R)DVWZ256mk(z?)$",
3155 "^VPS(L|R)L(V?)WZ256rmk(z?)$",
3156 "^VPSRA(V?)WZ256rmk(z?)$")>;
3157 def : InstRW<[SPRWriteResGroup313, ReadAfterVecXLd, ReadAfterVecXLd], (instregex "^VPMADD52(H|L)UQZ128m((b|k|bk|kz)?)$",
3158 "^VPMADD52(H|L)UQZ128mbkz$")>;
3160 def SPRWriteResGroup314 : SchedWriteRes<[SPRPort00_01]> {
3163 def : InstRW<[SPRWriteResGroup314], (instregex "^VCVT(T?)PD2(U?)QQZ(128|256)rr((k|kz)?)$",
3164 "^VCVT(U?)QQ2PDZ(128|256)rr((k|kz)?)$",
3165 "^VFIXUPIMMS(D|S)Zrri((k|kz)?)$",
3166 "^VPLZCNT(D|Q)Z(128|256)rr((k|kz)?)$",
3167 "^VPMADD52(H|L)UQZ(128|256)r((k|kz)?)$",
3168 "^VSCALEFS(D|S)Zrr((k|kz)?)$",
3169 "^VSCALEFS(D|S)Zrrb_Int((k|kz)?)$")>;
3170 def : InstRW<[SPRWriteResGroup314, ReadAfterVecLd], (instregex "^VFIXUPIMMS(D|S)Zrrib((k|kz)?)$")>;
3172 def SPRWriteResGroup315 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3174 let NumMicroOps = 3;
3176 def : InstRW<[SPRWriteResGroup315], (instregex "^VCVT(T?)PH2(U?)DQZ128rm(b?)$",
3177 "^VCVTPS2PHXZ128rm(b?)$")>;
3179 def SPRWriteResGroup316 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3181 let NumMicroOps = 3;
3183 def : InstRW<[SPRWriteResGroup316], (instregex "^VCVT(T?)PH2(U?)DQZ128rm(bk|kz)$",
3184 "^VCVT(T?)PH2(U?)DQZ128rm(k|bkz)$")>;
3186 def SPRWriteResGroup317 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3188 let NumMicroOps = 2;
3190 def : InstRW<[SPRWriteResGroup317], (instregex "^VCVT(T?)PH2(U?)DQZ(128|256)rrk(z?)$",
3191 "^VCVTP(H2PS|S2PH)(X?)Z256rrk(z?)$")>;
3193 def SPRWriteResGroup318 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3195 let NumMicroOps = 3;
3197 def : InstRW<[SPRWriteResGroup318], (instregex "^VCVT(T?)PH2(U?)DQZ256rm(bk|kz)$",
3198 "^VCVT(T?)PH2(U?)DQZ256rm(k|bkz)$",
3199 "^VCVTP(H2PS|S2PH)XZ256rm(bk|kz)$",
3200 "^VCVTP(H2PS|S2PH)XZ256rm(k|bkz)$")>;
3202 def SPRWriteResGroup319 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
3204 let NumMicroOps = 3;
3206 def : InstRW<[SPRWriteResGroup319], (instregex "^VCVT(T?)PH2(U?)DQZrm(bk|kz)$",
3207 "^VCVT(T?)PH2(U?)DQZrm(k|bkz)$",
3208 "^VCVTP(H2PS|S2PH)XZrm(bk|kz)$",
3209 "^VCVTP(H2PS|S2PH)XZrm(k|bkz)$")>;
3211 def SPRWriteResGroup320 : SchedWriteRes<[SPRPort00, SPRPort05]> {
3213 let NumMicroOps = 2;
3215 def : InstRW<[SPRWriteResGroup320], (instregex "^VCVT(T?)PH2(U?)DQZrr(b?)$",
3216 "^VCVTP(H2PS|S2PH)(X?)Zrr(b?)$",
3217 "^VPSHUFBITQMBZ(128|256)rrk$")>;
3218 def : InstRW<[SPRWriteResGroup320], (instrs VPSHUFBITQMBZrrk)>;
3220 def SPRWriteResGroup321 : SchedWriteRes<[SPRPort00, SPRPort05]> {
3222 let NumMicroOps = 2;
3224 def : InstRW<[SPRWriteResGroup321], (instregex "^VCVT(T?)PH2(U?)DQZrr(bk|kz)$",
3225 "^VCVT(T?)PH2(U?)DQZrr(k|bkz)$",
3226 "^VCVTP(H2PS|S2PH)XZrr(bk|kz)$",
3227 "^VCVTP(H2PS|S2PH)XZrr(k|bkz)$")>;
3229 def SPRWriteResGroup322 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3230 let ReleaseAtCycles = [2, 1, 1, 1, 2];
3232 let NumMicroOps = 7;
3234 def : InstRW<[SPRWriteResGroup322], (instregex "^VCVTPH2PDZ128rm(b?)$")>;
3236 def SPRWriteResGroup323 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3237 let ReleaseAtCycles = [2, 1, 1, 1, 2];
3239 let NumMicroOps = 7;
3241 def : InstRW<[SPRWriteResGroup323], (instregex "^VCVTPH2PDZ128rm(bk|kz)$",
3242 "^VCVTPH2PDZ128rm(k|bkz)$")>;
3244 def SPRWriteResGroup324 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort05]> {
3245 let ReleaseAtCycles = [2, 1, 1, 2];
3247 let NumMicroOps = 6;
3249 def : InstRW<[SPRWriteResGroup324], (instrs VCVTPH2PDZ128rr)>;
3251 def SPRWriteResGroup325 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort05]> {
3252 let ReleaseAtCycles = [2, 1, 1, 2];
3254 let NumMicroOps = 6;
3256 def : InstRW<[SPRWriteResGroup325], (instregex "^VCVTPH2PDZ128rrk(z?)$")>;
3258 def SPRWriteResGroup326 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3259 let ReleaseAtCycles = [2, 1, 2];
3261 let NumMicroOps = 5;
3263 def : InstRW<[SPRWriteResGroup326], (instregex "^VCVTPH2PDZ256rm(b?)$")>;
3265 def SPRWriteResGroup327 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3266 let ReleaseAtCycles = [2, 1, 2];
3268 let NumMicroOps = 5;
3270 def : InstRW<[SPRWriteResGroup327], (instregex "^VCVTPH2PDZ256rm(bk|kz)$",
3271 "^VCVTPH2PDZ256rm(k|bkz)$")>;
3273 def SPRWriteResGroup328 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3274 let ReleaseAtCycles = [2, 2];
3276 let NumMicroOps = 4;
3278 def : InstRW<[SPRWriteResGroup328], (instrs VCVTPH2PDZ256rr)>;
3280 def SPRWriteResGroup329 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3281 let ReleaseAtCycles = [2, 2];
3283 let NumMicroOps = 4;
3285 def : InstRW<[SPRWriteResGroup329], (instregex "^VCVTPH2PDZ256rrk(z?)$")>;
3287 def SPRWriteResGroup330 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3289 let NumMicroOps = 2;
3291 def : InstRW<[SPRWriteResGroup330], (instregex "^VCVTP(H2PS|S2PH)(X?)Z128rrk(z?)$")>;
3293 def SPRWriteResGroup331 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
3295 let NumMicroOps = 2;
3297 def : InstRW<[SPRWriteResGroup331], (instregex "^VCVTPH2PSZ(128|256)rmk(z?)$")>;
3298 def : InstRW<[SPRWriteResGroup331, ReadAfterVecLd], (instregex "^VCVTSH2SSZrm_Intk(z?)$")>;
3299 def : InstRW<[SPRWriteResGroup331, ReadAfterVecXLd], (instregex "^VPMADDUBSWZ128rmk(z?)$",
3300 "^VPMULH((U|RS)?)WZ128rmk(z?)$",
3301 "^VPMULLWZ128rmk(z?)$")>;
3302 def : InstRW<[SPRWriteResGroup331, ReadAfterVecYLd], (instregex "^VPMADDUBSWZ256rmk(z?)$",
3303 "^VPMULH((U|RS)?)WZ256rmk(z?)$",
3304 "^VPMULLWZ256rmk(z?)$")>;
3306 def SPRWriteResGroup332 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
3308 let NumMicroOps = 3;
3310 def : InstRW<[SPRWriteResGroup332], (instregex "^VCVT(T?)PS2(U?)QQZrm((b|k|bk|kz)?)$",
3311 "^VCVT(T?)PS2(U?)QQZrmbkz$")>;
3312 def : InstRW<[SPRWriteResGroup332], (instrs VCVTPH2PSZrm)>;
3313 def : InstRW<[SPRWriteResGroup332, ReadAfterVecYLd], (instregex "^VPERMWZrmk(z?)$")>;
3315 def SPRWriteResGroup333 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3316 let ReleaseAtCycles = [1, 2, 1, 1, 1];
3318 let NumMicroOps = 6;
3320 def : InstRW<[SPRWriteResGroup333], (instregex "^VCVT(T?)PH2(U?)QQZ128rm((b|k|bk|kz)?)$",
3321 "^VCVT(T?)PH2(U?)QQZ128rmbkz$")>;
3323 def SPRWriteResGroup334 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
3324 let ReleaseAtCycles = [1, 2, 1];
3326 let NumMicroOps = 4;
3328 def : InstRW<[SPRWriteResGroup334], (instregex "^VCVT(T?)PH2(U?)QQZ(128|256)rr((k|kz)?)$")>;
3330 def SPRWriteResGroup335 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3331 let ReleaseAtCycles = [1, 2, 1, 1, 1];
3333 let NumMicroOps = 6;
3335 def : InstRW<[SPRWriteResGroup335], (instregex "^VCVT(T?)PH2(U?)QQZ256rm((b|k|bk|kz)?)$",
3336 "^VCVT(T?)PH2(U?)QQZ256rmbkz$")>;
3338 def SPRWriteResGroup336 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3340 let NumMicroOps = 3;
3342 def : InstRW<[SPRWriteResGroup336], (instregex "^VCVTPS2PHXZ128rm(bk|kz)$",
3343 "^VCVTPS2PHXZ128rm(k|bkz)$",
3344 "^VCVTPS2PHXZ256rm(b?)$")>;
3346 def SPRWriteResGroup337 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
3348 let NumMicroOps = 3;
3350 def : InstRW<[SPRWriteResGroup337], (instregex "^VCVTPS2PHXZrm(b?)$")>;
3352 def SPRWriteResGroup338 : SchedWriteRes<[SPRPort00_01, SPRPort04_09, SPRPort07_08]> {
3354 let NumMicroOps = 3;
3356 def : InstRW<[SPRWriteResGroup338], (instregex "^VCVTPS2PHZ(128|256)mrk$")>;
3358 def SPRWriteResGroup339 : SchedWriteRes<[SPRPort00, SPRPort04_09, SPRPort07_08]> {
3360 let NumMicroOps = 3;
3362 def : InstRW<[SPRWriteResGroup339], (instrs VCVTPS2PHZmrk)>;
3364 def SPRWriteResGroup340 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3366 let NumMicroOps = 2;
3368 def : InstRW<[SPRWriteResGroup340], (instregex "^VCVT(T?)PS2(U?)QQZ128rr((k|kz)?)$",
3369 "^VCVT(U?)QQ2PSZ128rr((k|kz)?)$")>;
3371 def SPRWriteResGroup341 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
3373 let NumMicroOps = 5;
3375 def : InstRW<[SPRWriteResGroup341], (instregex "^VCVT(U?)QQ2PHZ128rm(b?)$")>;
3377 def SPRWriteResGroup342 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
3379 let NumMicroOps = 5;
3381 def : InstRW<[SPRWriteResGroup342], (instregex "^VCVT(U?)QQ2PHZ128rm(bk|kz)$",
3382 "^VCVT(U?)QQ2PHZ128rm(k|bkz)$")>;
3384 def SPRWriteResGroup343 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort05]> {
3386 let NumMicroOps = 4;
3388 def : InstRW<[SPRWriteResGroup343], (instregex "^VCVT(U?)QQ2PHZ128rr$")>;
3390 def SPRWriteResGroup344 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort05]> {
3392 let NumMicroOps = 4;
3394 def : InstRW<[SPRWriteResGroup344], (instregex "^VCVT(U?)QQ2PHZ128rrk(z?)$",
3395 "^VCVT(U?)QQ2PHZ256rr$")>;
3397 def SPRWriteResGroup345 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
3399 let NumMicroOps = 5;
3401 def : InstRW<[SPRWriteResGroup345], (instregex "^VCVT(U?)QQ2PHZ256rm(b?)$")>;
3403 def SPRWriteResGroup346 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
3405 let NumMicroOps = 5;
3407 def : InstRW<[SPRWriteResGroup346], (instregex "^VCVT(U?)QQ2PHZ256rm(bk|kz)$",
3408 "^VCVT(U?)QQ2PHZ256rm(k|bkz)$")>;
3410 def SPRWriteResGroup347 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort05]> {
3412 let NumMicroOps = 4;
3414 def : InstRW<[SPRWriteResGroup347], (instregex "^VCVT(U?)QQ2PHZ256rrk(z?)$")>;
3416 def SPRWriteResGroup348 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
3417 let ReleaseAtCycles = [1, 1, 1, 2];
3419 let NumMicroOps = 5;
3421 def : InstRW<[SPRWriteResGroup348], (instregex "^VCVT(U?)QQ2PHZrm(b?)$")>;
3423 def SPRWriteResGroup349 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
3424 let ReleaseAtCycles = [1, 1, 1, 2];
3426 let NumMicroOps = 5;
3428 def : InstRW<[SPRWriteResGroup349], (instregex "^VCVT(U?)QQ2PHZrm(bk|kz)$",
3429 "^VCVT(U?)QQ2PHZrm(k|bkz)$")>;
3431 def SPRWriteResGroup350 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
3432 let ReleaseAtCycles = [1, 1, 2];
3434 let NumMicroOps = 4;
3436 def : InstRW<[SPRWriteResGroup350], (instregex "^VCVT(U?)QQ2PHZrr(b?)$")>;
3438 def SPRWriteResGroup351 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
3439 let ReleaseAtCycles = [1, 1, 2];
3441 let NumMicroOps = 4;
3443 def : InstRW<[SPRWriteResGroup351], (instregex "^VCVT(U?)QQ2PHZrr(bk|kz)$",
3444 "^VCVT(U?)QQ2PHZrr(k|bkz)$")>;
3446 def SPRWriteResGroup352 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3447 let ReleaseAtCycles = [2, 2, 1, 1, 1];
3449 let NumMicroOps = 7;
3451 def : InstRW<[SPRWriteResGroup352, ReadAfterVecLd], (instregex "^VCVTSD2SHZrm((_Int)?)$")>;
3453 def SPRWriteResGroup353 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3454 let ReleaseAtCycles = [2, 2, 1, 1, 1];
3456 let NumMicroOps = 7;
3458 def : InstRW<[SPRWriteResGroup353, ReadAfterVecLd], (instregex "^VCVTSD2SHZrm_Intk(z?)$")>;
3460 def SPRWriteResGroup354 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
3461 let ReleaseAtCycles = [2, 1, 1];
3463 let NumMicroOps = 4;
3465 def : InstRW<[SPRWriteResGroup354], (instregex "^VCVTSD2SHZrr(b?)_Int$")>;
3466 def : InstRW<[SPRWriteResGroup354], (instrs VCVTSD2SHZrr)>;
3468 def SPRWriteResGroup355 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
3469 let ReleaseAtCycles = [2, 1, 1];
3471 let NumMicroOps = 4;
3473 def : InstRW<[SPRWriteResGroup355], (instregex "^VCVTSD2SHZrr(b?)_Intk(z?)$")>;
3475 def SPRWriteResGroup356 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3476 let ReleaseAtCycles = [2, 1, 1];
3478 let NumMicroOps = 4;
3480 def : InstRW<[SPRWriteResGroup356, ReadAfterVecLd], (instregex "^VCVTSH2SDZrm((_Int)?)$")>;
3482 def SPRWriteResGroup357 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3483 let ReleaseAtCycles = [2, 1, 1];
3485 let NumMicroOps = 4;
3487 def : InstRW<[SPRWriteResGroup357, ReadAfterVecLd], (instregex "^VCVTSH2SDZrm_Intk(z?)$")>;
3489 def SPRWriteResGroup358 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3490 let ReleaseAtCycles = [2, 1];
3492 let NumMicroOps = 3;
3494 def : InstRW<[SPRWriteResGroup358], (instregex "^VCVTSH2SDZrr(b?)_Int$")>;
3495 def : InstRW<[SPRWriteResGroup358], (instrs VCVTSH2SDZrr)>;
3497 def SPRWriteResGroup359 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3498 let ReleaseAtCycles = [2, 1];
3500 let NumMicroOps = 3;
3502 def : InstRW<[SPRWriteResGroup359], (instregex "^VCVTSH2SDZrr(b?)_Intk(z?)$")>;
3504 def SPRWriteResGroup360 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort02_03_11]> {
3506 let NumMicroOps = 3;
3508 def : InstRW<[SPRWriteResGroup360, ReadAfterVecLd], (instregex "^VCVT(T?)SH2(U?)SI((64)?)Zrm_Int$",
3509 "^VCVTTSH2(U?)SI((64)?)Zrm$")>;
3511 def SPRWriteResGroup361 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05]> {
3513 let NumMicroOps = 3;
3515 def : InstRW<[SPRWriteResGroup361], (instregex "^VCVT(T?)SH2(U?)SI((64)?)Zrr(b?)_Int$",
3516 "^VCVTTSH2(U?)SI((64)?)Zrr$")>;
3518 def SPRWriteResGroup362 : SchedWriteRes<[SPRPort00_01]> {
3521 def : InstRW<[SPRWriteResGroup362], (instregex "^VCVTSH2SSZrr(b?)_Intk(z?)$")>;
3523 def SPRWriteResGroup363 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11]> {
3525 let NumMicroOps = 3;
3527 def : InstRW<[SPRWriteResGroup363, ReadAfterVecLd], (instregex "^VCVT(U?)SI((64)?)2SHZrm((_Int)?)$",
3528 "^VCVTSS2SHZrm((_Int)?)$")>;
3530 def SPRWriteResGroup364 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11]> {
3532 let NumMicroOps = 3;
3534 def : InstRW<[SPRWriteResGroup364, ReadAfterVecLd], (instregex "^VCVTSS2SHZrm_Intk(z?)$")>;
3536 def SPRWriteResGroup365 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05]> {
3538 let NumMicroOps = 2;
3540 def : InstRW<[SPRWriteResGroup365], (instregex "^VCVTSS2SHZrr(b?)_Int$")>;
3541 def : InstRW<[SPRWriteResGroup365], (instrs VCVTSS2SHZrr)>;
3543 def SPRWriteResGroup366 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05]> {
3545 let NumMicroOps = 2;
3547 def : InstRW<[SPRWriteResGroup366], (instregex "^VCVTSS2SHZrr(b?)_Intk(z?)$")>;
3549 def SPRWriteResGroup367 : SchedWriteRes<[SPRPort05]> {
3552 def : InstRW<[SPRWriteResGroup367], (instregex "^VDBPSADBWZ(128|256)rrik(z?)$",
3553 "^VDBPSADBWZrrik(z?)$",
3554 "^VPACK(S|U)S(DW|WB)Z(128|256)rrk(z?)$",
3555 "^VPACK(S|U)S(DW|WB)Zrrk(z?)$",
3556 "^VPBROADCAST(B|W|Dr|Qr|Wr)Z((256)?)rrk(z?)$",
3557 "^VPBROADCAST(B|D|Q|W)rZ(128|256)rr$",
3558 "^VPBROADCASTBrZ(128|256)rrk(z?)$",
3559 "^VPBROADCAST(B|D|Q|W)rZrr$",
3560 "^VPBROADCASTBrZrrk(z?)$",
3561 "^VPBROADCAST(D|Q|W)rZ128rrk(z?)$",
3562 "^VPERMBZ(128|256)rrk(z?)$",
3564 "^VPMOV(S|Z)XBWZ((256)?)rrk(z?)$",
3565 "^VPMULTISHIFTQBZ(128|256)rrk(z?)$",
3566 "^VPMULTISHIFTQBZrrk(z?)$",
3567 "^VPOPCNT(B|W)Z(128|256)rrk(z?)$",
3568 "^VPOPCNT(B|W)Zrrk(z?)$")>;
3570 def SPRWriteResGroup368 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
3571 let ReleaseAtCycles = [2, 1, 1];
3573 let NumMicroOps = 4;
3575 def : InstRW<[SPRWriteResGroup368, ReadAfterVecXLd], (instregex "^VDIVPHZ128rm(b?)$")>;
3577 def SPRWriteResGroup369 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
3578 let ReleaseAtCycles = [2, 1, 1];
3580 let NumMicroOps = 4;
3582 def : InstRW<[SPRWriteResGroup369, ReadAfterVecXLd], (instregex "^VDIVPHZ128rm(bk|kz)$",
3583 "^VDIVPHZ128rm(k|bkz)$")>;
3585 def SPRWriteResGroup370 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
3586 let ReleaseAtCycles = [2, 1];
3588 let NumMicroOps = 3;
3590 def : InstRW<[SPRWriteResGroup370], (instregex "^VDIVPHZ(128|256)rr$")>;
3592 def SPRWriteResGroup371 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
3593 let ReleaseAtCycles = [2, 1];
3595 let NumMicroOps = 3;
3597 def : InstRW<[SPRWriteResGroup371], (instregex "^VDIVPHZ(128|256)rrk$",
3598 "^VSQRTPHZ(128|256)r$")>;
3599 def : InstRW<[SPRWriteResGroup371], (instrs VDIVPHZ128rrkz)>;
3601 def SPRWriteResGroup372 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
3602 let ReleaseAtCycles = [2, 1, 1];
3604 let NumMicroOps = 4;
3606 def : InstRW<[SPRWriteResGroup372, ReadAfterVecYLd], (instregex "^VDIVPHZ256rm(b?)$")>;
3608 def SPRWriteResGroup373 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
3609 let ReleaseAtCycles = [2, 1, 1];
3611 let NumMicroOps = 4;
3613 def : InstRW<[SPRWriteResGroup373, ReadAfterVecYLd], (instregex "^VDIVPHZ256rm(bk|kz)$",
3614 "^VDIVPHZ256rm(k|bkz)$")>;
3615 def : InstRW<[SPRWriteResGroup373, ReadAfterVecXLd], (instregex "^VSQRTPHZ128m(b?)$")>;
3617 def SPRWriteResGroup374 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
3618 let ReleaseAtCycles = [2, 1];
3620 let NumMicroOps = 3;
3622 def : InstRW<[SPRWriteResGroup374], (instrs VDIVPHZ256rrkz)>;
3624 def SPRWriteResGroup375 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3625 let ReleaseAtCycles = [4, 2, 1, 1, 1];
3627 let NumMicroOps = 9;
3629 def : InstRW<[SPRWriteResGroup375, ReadAfterVecYLd], (instregex "^VDIVPHZrm(b?)$")>;
3631 def SPRWriteResGroup376 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
3632 let ReleaseAtCycles = [4, 2, 1, 1, 1];
3634 let NumMicroOps = 9;
3636 def : InstRW<[SPRWriteResGroup376, ReadAfterVecYLd], (instregex "^VDIVPHZrm(bk|kz)$",
3637 "^VDIVPHZrm(k|bkz)$")>;
3639 def SPRWriteResGroup377 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort05]> {
3640 let ReleaseAtCycles = [4, 1, 1];
3642 let NumMicroOps = 6;
3644 def : InstRW<[SPRWriteResGroup377], (instregex "^VDIVPHZrr(b?)$")>;
3646 def SPRWriteResGroup378 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort05]> {
3647 let ReleaseAtCycles = [4, 1, 1];
3649 let NumMicroOps = 6;
3651 def : InstRW<[SPRWriteResGroup378], (instregex "^VDIVPHZrr(bk|kz)$",
3652 "^VDIVPHZrr(k|bkz)$")>;
3654 def SPRWriteResGroup379 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
3655 let ReleaseAtCycles = [2, 1];
3657 let NumMicroOps = 3;
3659 def : InstRW<[SPRWriteResGroup379], (instrs VDIVPSZrr)>;
3661 def SPRWriteResGroup380 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
3663 let NumMicroOps = 2;
3665 def : InstRW<[SPRWriteResGroup380, ReadAfterVecLd], (instregex "^VDIVSHZrm_Int((k|kz)?)$")>;
3666 def : InstRW<[SPRWriteResGroup380, ReadAfterVecLd], (instrs VDIVSHZrm)>;
3668 def SPRWriteResGroup381 : SchedWriteRes<[SPRPort00]> {
3671 def : InstRW<[SPRWriteResGroup381], (instrs VDIVSHZrr_Int,
3674 def SPRWriteResGroup382 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3675 let ReleaseAtCycles = [2, 1, 2];
3677 let NumMicroOps = 5;
3679 def : InstRW<[SPRWriteResGroup382, ReadAfterVecXLd], (instregex "^VDPBF16PSZ128m((b|k|bk|kz)?)$")>;
3680 def : InstRW<[SPRWriteResGroup382, ReadAfterVecXLd], (instrs VDPBF16PSZ128mbkz)>;
3682 def SPRWriteResGroup383 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
3683 let ReleaseAtCycles = [2, 2];
3685 let NumMicroOps = 4;
3687 def : InstRW<[SPRWriteResGroup383], (instregex "^VDPBF16PSZ(128|256)r((k|kz)?)$")>;
3689 def SPRWriteResGroup384 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
3690 let ReleaseAtCycles = [2, 1, 2];
3692 let NumMicroOps = 5;
3694 def : InstRW<[SPRWriteResGroup384, ReadAfterVecYLd], (instregex "^VDPBF16PSZ256m((b|k|bk|kz)?)$")>;
3695 def : InstRW<[SPRWriteResGroup384, ReadAfterVecYLd], (instrs VDPBF16PSZ256mbkz)>;
3697 def SPRWriteResGroup385 : SchedWriteRes<[SPRPort00, SPRPort01, SPRPort02_03_11]> {
3698 let ReleaseAtCycles = [6, 7, 18];
3700 let NumMicroOps = 31;
3702 def : InstRW<[SPRWriteResGroup385], (instrs VERRm)>;
3704 def SPRWriteResGroup386 : SchedWriteRes<[SPRPort00, SPRPort01, SPRPort02_03_11]> {
3705 let ReleaseAtCycles = [6, 7, 17];
3707 let NumMicroOps = 30;
3709 def : InstRW<[SPRWriteResGroup386], (instrs VERRr)>;
3711 def SPRWriteResGroup387 : SchedWriteRes<[SPRPort00, SPRPort01, SPRPort02_03_11]> {
3712 let ReleaseAtCycles = [5, 8, 21];
3714 let NumMicroOps = 34;
3716 def : InstRW<[SPRWriteResGroup387], (instrs VERWm)>;
3718 def SPRWriteResGroup388 : SchedWriteRes<[SPRPort00, SPRPort01, SPRPort02_03_11]> {
3719 let ReleaseAtCycles = [5, 8, 20];
3721 let NumMicroOps = 33;
3723 def : InstRW<[SPRWriteResGroup388], (instrs VERWr)>;
3725 def SPRWriteResGroup389 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
3726 let ReleaseAtCycles = [1, 2];
3728 let NumMicroOps = 3;
3730 def : InstRW<[SPRWriteResGroup389, ReadAfterVecYLd], (instregex "^VEXPANDP(D|S)Z128rm((k|kz)?)$",
3731 "^VPEXPAND(B|D|Q|W)Z128rm$",
3732 "^VPEXPAND(D|Q)Z128rmk(z?)$")>;
3734 def SPRWriteResGroup390 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
3735 let ReleaseAtCycles = [2, 1];
3737 let NumMicroOps = 3;
3739 def : InstRW<[SPRWriteResGroup390], (instregex "^VF(C?)MADDCPHZ(128|256)m(b?)$",
3740 "^VROUNDP(D|S)Ym$")>;
3741 def : InstRW<[SPRWriteResGroup390, ReadAfterVecXLd], (instregex "^VF(C?)MADDCSHZm$",
3742 "^VF(C?)MULCPHZ128rm(b?)$",
3743 "^VF(C?)MULCSHZrm$",
3744 "^VRNDSCALEPHZ128rm(b?)i$",
3745 "^VRNDSCALESHZm((_Int)?)$",
3746 "^VSCALEFPHZ128rm(b?)$")>;
3747 def : InstRW<[SPRWriteResGroup390, ReadAfterVecYLd], (instregex "^VF(C?)MULCPHZ256rm(b?)$",
3748 "^VRNDSCALEP(D|H|S)Z256rm(b?)i$",
3749 "^VRNDSCALEP(D|S)Z256rm(b?)ik(z?)$",
3750 "^VSCALEFPHZ256rm(b?)$")>;
3751 def : InstRW<[SPRWriteResGroup390, ReadAfterVecLd], (instrs VSCALEFSHZrm)>;
3753 def SPRWriteResGroup391 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
3754 let ReleaseAtCycles = [2, 1];
3756 let NumMicroOps = 3;
3758 def : InstRW<[SPRWriteResGroup391], (instregex "^VF(C?)MADDCPHZ(128|256)m(bk|kz)$",
3759 "^VF(C?)MADDCPHZ(128|256)m(k|bkz)$")>;
3760 def : InstRW<[SPRWriteResGroup391, ReadAfterVecXLd], (instregex "^VF(C?)MADDCSHZmk(z?)$",
3761 "^VF(C?)MULCPHZ128rm(bk|kz)$",
3762 "^VF(C?)MULCPHZ128rm(k|bkz)$",
3763 "^VF(C?)MULCSHZrmk(z?)$")>;
3764 def : InstRW<[SPRWriteResGroup391, ReadAfterVecYLd], (instregex "^VF(C?)MULCPHZ256rm(bk|kz)$",
3765 "^VF(C?)MULCPHZ256rm(k|bkz)$")>;
3767 def SPRWriteResGroup392 : SchedWriteRes<[SPRPort00_01]> {
3768 let ReleaseAtCycles = [2];
3770 let NumMicroOps = 2;
3772 def : InstRW<[SPRWriteResGroup392], (instregex "^VF(C?)MADDCPHZ(128|256)r$",
3773 "^VF(C?)MADDCSHZr(b?)$",
3774 "^VF(C?)MULCPHZ(128|256)rr$",
3775 "^VF(C?)MULCSHZrr(b?)$",
3776 "^VRNDSCALEPHZ(128|256)rri$",
3777 "^VRNDSCALESHZr(b?)_Int$",
3778 "^VSCALEFPHZ(128|256)rr$")>;
3779 def : InstRW<[SPRWriteResGroup392], (instrs VRNDSCALESHZr,
3781 VSCALEFSHZrrb_Int)>;
3783 def SPRWriteResGroup393 : SchedWriteRes<[SPRPort00_01]> {
3784 let ReleaseAtCycles = [2];
3786 let NumMicroOps = 2;
3788 def : InstRW<[SPRWriteResGroup393], (instregex "^VF(C?)MADDCPHZ(128|256)rk(z?)$",
3789 "^VF(C?)MADDCSHZr(bk|kz)$",
3790 "^VF(C?)MADDCSHZr(k|bkz)$",
3791 "^VF(C?)MULCPHZ(128|256)rrk(z?)$",
3792 "^VF(C?)MULCSHZrr(bk|kz)$",
3793 "^VF(C?)MULCSHZrr(k|bkz)$")>;
3795 def SPRWriteResGroup394 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
3796 let ReleaseAtCycles = [2, 1];
3798 let NumMicroOps = 3;
3800 def : InstRW<[SPRWriteResGroup394], (instregex "^VF(C?)MADDCPHZm(b?)$")>;
3801 def : InstRW<[SPRWriteResGroup394, ReadAfterVecYLd], (instregex "^VF(C?)MULCPHZrm(b?)$",
3802 "^VRNDSCALEP(D|H|S)Zrm(b?)i$",
3803 "^VRNDSCALEP(D|S)Zrm(b?)ik(z?)$",
3804 "^VSCALEFPHZrm(b?)$")>;
3806 def SPRWriteResGroup395 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
3807 let ReleaseAtCycles = [2, 1];
3809 let NumMicroOps = 3;
3811 def : InstRW<[SPRWriteResGroup395], (instregex "^VF(C?)MADDCPHZm(bk|kz)$",
3812 "^VF(C?)MADDCPHZm(k|bkz)$")>;
3813 def : InstRW<[SPRWriteResGroup395, ReadAfterVecYLd], (instregex "^VF(C?)MULCPHZrm(bk|kz)$",
3814 "^VF(C?)MULCPHZrm(k|bkz)$")>;
3816 def SPRWriteResGroup396 : SchedWriteRes<[SPRPort00]> {
3817 let ReleaseAtCycles = [2];
3819 let NumMicroOps = 2;
3821 def : InstRW<[SPRWriteResGroup396], (instregex "^VF(C?)MADDCPHZr(b?)$",
3822 "^VF(C?)MULCPHZrr(b?)$",
3823 "^VRNDSCALEPHZrri(b?)$",
3824 "^VSCALEFPHZrr(b?)$")>;
3826 def SPRWriteResGroup397 : SchedWriteRes<[SPRPort00]> {
3827 let ReleaseAtCycles = [2];
3829 let NumMicroOps = 2;
3831 def : InstRW<[SPRWriteResGroup397], (instregex "^VF(C?)MADDCPHZr(bk|kz)$",
3832 "^VF(C?)MADDCPHZr(k|bkz)$",
3833 "^VF(C?)MULCPHZrr(bk|kz)$",
3834 "^VF(C?)MULCPHZrr(k|bkz)$")>;
3836 def SPRWriteResGroup398 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11]> {
3837 let ReleaseAtCycles = [1, 1, 2, 4];
3839 let NumMicroOps = 8;
3841 def : InstRW<[SPRWriteResGroup398, WriteVecMaskedGatherWriteback], (instregex "^VGATHER(D|Q)PDYrm$",
3842 "^VPGATHER(D|Q)QYrm$")>;
3843 def : InstRW<[SPRWriteResGroup398, WriteVecMaskedGatherWriteback], (instrs VGATHERQPSYrm,
3846 def SPRWriteResGroup399 : SchedWriteRes<[SPRPort00, SPRPort01_05, SPRPort02_03_11]> {
3847 let ReleaseAtCycles = [1, 1, 2];
3849 let NumMicroOps = 4;
3851 def : InstRW<[SPRWriteResGroup399, WriteVecMaskedGatherWriteback], (instregex "^VGATHER(D|Q)PDZ128rm$",
3852 "^VPGATHER(D|Q)QZ128rm$")>;
3853 def : InstRW<[SPRWriteResGroup399, WriteVecMaskedGatherWriteback], (instrs VGATHERQPSZ128rm,
3856 def SPRWriteResGroup400 : SchedWriteRes<[SPRPort00, SPRPort01_05, SPRPort02_03_11]> {
3857 let ReleaseAtCycles = [1, 2, 4];
3859 let NumMicroOps = 7;
3861 def : InstRW<[SPRWriteResGroup400, WriteVecMaskedGatherWriteback], (instregex "^VGATHER(D|Q)PDZ256rm$",
3862 "^VPGATHER(D|Q)QZ256rm$")>;
3863 def : InstRW<[SPRWriteResGroup400, WriteVecMaskedGatherWriteback], (instrs VGATHERQPSZ256rm,
3866 def SPRWriteResGroup401 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
3867 let ReleaseAtCycles = [1, 8, 2];
3869 let NumMicroOps = 11;
3871 def : InstRW<[SPRWriteResGroup401, WriteVecMaskedGatherWriteback], (instregex "^VGATHER(D|Q)PDZrm$",
3872 "^VPGATHER(D|Q)QZrm$")>;
3873 def : InstRW<[SPRWriteResGroup401, WriteVecMaskedGatherWriteback], (instrs VGATHERQPSZrm,
3876 def SPRWriteResGroup402 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11]> {
3877 let ReleaseAtCycles = [1, 1, 1, 2];
3879 let NumMicroOps = 5;
3881 def : InstRW<[SPRWriteResGroup402, WriteVecMaskedGatherWriteback], (instregex "^VGATHER(D|Q)PDrm$",
3882 "^VPGATHER(D|Q)Qrm$")>;
3883 def : InstRW<[SPRWriteResGroup402, WriteVecMaskedGatherWriteback], (instrs VGATHERQPSrm,
3886 def SPRWriteResGroup403 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11]> {
3887 let ReleaseAtCycles = [1, 1, 2, 8];
3889 let NumMicroOps = 12;
3891 def : InstRW<[SPRWriteResGroup403, WriteVecMaskedGatherWriteback], (instrs VGATHERDPSYrm,
3894 def SPRWriteResGroup404 : SchedWriteRes<[SPRPort00, SPRPort01_05, SPRPort02_03_11]> {
3895 let ReleaseAtCycles = [1, 2, 4];
3897 let NumMicroOps = 7;
3899 def : InstRW<[SPRWriteResGroup404, WriteVecMaskedGatherWriteback], (instrs VGATHERDPSZ128rm,
3902 def SPRWriteResGroup405 : SchedWriteRes<[SPRPort00, SPRPort01_05, SPRPort02_03_11]> {
3903 let ReleaseAtCycles = [1, 2, 8];
3905 let NumMicroOps = 11;
3907 def : InstRW<[SPRWriteResGroup405, WriteVecMaskedGatherWriteback], (instrs VGATHERDPSZ256rm,
3910 def SPRWriteResGroup406 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
3911 let ReleaseAtCycles = [1, 16, 2];
3913 let NumMicroOps = 19;
3915 def : InstRW<[SPRWriteResGroup406, WriteVecMaskedGatherWriteback], (instrs VGATHERDPSZrm,
3918 def SPRWriteResGroup407 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11]> {
3919 let ReleaseAtCycles = [1, 1, 2, 4];
3921 let NumMicroOps = 8;
3923 def : InstRW<[SPRWriteResGroup407, WriteVecMaskedGatherWriteback], (instrs VGATHERDPSrm,
3926 def SPRWriteResGroup408 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
3928 let NumMicroOps = 2;
3930 def : InstRW<[SPRWriteResGroup408, ReadAfterVecXLd], (instregex "^VGF2P8AFFINE((INV)?)QBZ128rm(b?)ik(z?)$",
3931 "^VGF2P8MULBZ128rmk(z?)$")>;
3932 def : InstRW<[SPRWriteResGroup408, ReadAfterVecYLd], (instregex "^VGF2P8AFFINE((INV)?)QBZ256rm(b?)ik(z?)$",
3933 "^VGF2P8MULBZ256rmk(z?)$")>;
3935 def SPRWriteResGroup409 : SchedWriteRes<[SPRPort00_01]> {
3938 def : InstRW<[SPRWriteResGroup409], (instregex "^VGF2P8AFFINE((INV)?)QBZ(128|256)rrik$",
3939 "^VGF2P8MULBZ(128|256)rrk$")>;
3941 def SPRWriteResGroup410 : SchedWriteRes<[SPRPort00_01]> {
3944 def : InstRW<[SPRWriteResGroup410], (instregex "^VGF2P8AFFINE((INV)?)QBZ(128|256)rrikz$",
3945 "^VGF2P8MULBZ(128|256)rrkz$")>;
3947 def SPRWriteResGroup411 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
3949 let NumMicroOps = 2;
3951 def : InstRW<[SPRWriteResGroup411, ReadAfterVecYLd], (instregex "^VGF2P8AFFINE((INV)?)QBZrm(b?)ik(z?)$",
3952 "^VGF2P8MULBZrmk(z?)$")>;
3954 def SPRWriteResGroup412 : SchedWriteRes<[SPRPort00]> {
3957 def : InstRW<[SPRWriteResGroup412], (instregex "^VGF2P8AFFINE((INV)?)QBZrrik$")>;
3958 def : InstRW<[SPRWriteResGroup412], (instrs VGF2P8MULBZrrk)>;
3960 def SPRWriteResGroup413 : SchedWriteRes<[SPRPort00]> {
3963 def : InstRW<[SPRWriteResGroup413], (instregex "^VGF2P8AFFINE((INV)?)QBZrrikz$")>;
3964 def : InstRW<[SPRWriteResGroup413], (instrs VGF2P8MULBZrrkz)>;
3966 def SPRWriteResGroup414 : SchedWriteRes<[SPRPort01_05, SPRPort05]> {
3967 let ReleaseAtCycles = [1, 2];
3969 let NumMicroOps = 3;
3971 def : InstRW<[SPRWriteResGroup414], (instregex "^VH(ADD|SUB)P(D|S)rr$")>;
3973 def SPRWriteResGroup415 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort02_03_11]> {
3975 let NumMicroOps = 3;
3977 def : InstRW<[SPRWriteResGroup415], (instrs VLDMXCSR)>;
3979 def SPRWriteResGroup416 : SchedWriteRes<[SPRPort01, SPRPort01_05, SPRPort02_03, SPRPort02_03_11, SPRPort04, SPRPort04_09, SPRPort05, SPRPort06]> {
3980 let ReleaseAtCycles = [1, 1, 1, 8, 1, 1, 2, 3];
3982 let NumMicroOps = 18;
3984 def : InstRW<[SPRWriteResGroup416], (instrs VMCLEARm)>;
3986 def SPRWriteResGroup417 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11]> {
3988 let NumMicroOps = 2;
3990 def : InstRW<[SPRWriteResGroup417], (instregex "^VMOVDQU(8|16)Z(128|256)rmk(z?)$",
3991 "^VMOVSHZrmk(z?)$")>;
3992 def : InstRW<[SPRWriteResGroup417, ReadAfterVecXLd], (instregex "^VP(ADD|SUB)(B|W)Z128rmk(z?)$",
3993 "^VPBLENDM(B|W)Z128rmk(z?)$")>;
3994 def : InstRW<[SPRWriteResGroup417, ReadAfterVecYLd], (instregex "^VP(ADD|SUB)(B|W)Z256rmk(z?)$",
3995 "^VPBLENDM(B|W)Z256rmk(z?)$")>;
3997 def SPRWriteResGroup418 : SchedWriteRes<[SPRPort00_01_05]> {
4000 def : InstRW<[SPRWriteResGroup418], (instregex "^VMOVDQU(8|16)Z(128|256)rrk(z?)((_REV)?)$",
4001 "^VMOVSHZrrk(z?)((_REV)?)$",
4002 "^VP(ADD|SUB)(B|W)Z(128|256)rrk(z?)$",
4003 "^VPBLENDM(B|W)Z(128|256)rrk(z?)$",
4004 "^VPMOVM2(B|W)Z(128|256)rr$")>;
4006 def SPRWriteResGroup419 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
4007 let ReleaseAtCycles = [1, 2, 2];
4009 let NumMicroOps = 5;
4011 def : InstRW<[SPRWriteResGroup419], (instrs VMOVDQU8Zmrk)>;
4013 def SPRWriteResGroup420 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4015 let NumMicroOps = 2;
4017 def : InstRW<[SPRWriteResGroup420], (instrs VMOVNTDQZ128mr)>;
4019 def SPRWriteResGroup421 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4021 let NumMicroOps = 2;
4023 def : InstRW<[SPRWriteResGroup421], (instrs VMOVNTDQZ256mr,
4026 def SPRWriteResGroup422 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4028 let NumMicroOps = 2;
4030 def : InstRW<[SPRWriteResGroup422], (instregex "^VMOVNT(PD|DQZ)mr$")>;
4032 def SPRWriteResGroup423 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4034 let NumMicroOps = 2;
4036 def : InstRW<[SPRWriteResGroup423], (instrs VMOVNTDQmr)>;
4038 def SPRWriteResGroup424 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4040 let NumMicroOps = 2;
4042 def : InstRW<[SPRWriteResGroup424], (instrs VMOVNTPDZ128mr)>;
4044 def SPRWriteResGroup425 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4046 let NumMicroOps = 2;
4048 def : InstRW<[SPRWriteResGroup425], (instrs VMOVNTPDZ256mr)>;
4050 def SPRWriteResGroup426 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4052 let NumMicroOps = 2;
4054 def : InstRW<[SPRWriteResGroup426], (instrs VMOVNTPDZmr)>;
4056 def SPRWriteResGroup427 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4058 let NumMicroOps = 2;
4060 def : InstRW<[SPRWriteResGroup427], (instrs VMOVNTPSYmr)>;
4062 def SPRWriteResGroup428 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4064 let NumMicroOps = 2;
4066 def : InstRW<[SPRWriteResGroup428], (instrs VMOVNTPSZ128mr)>;
4068 def SPRWriteResGroup429 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4070 let NumMicroOps = 2;
4072 def : InstRW<[SPRWriteResGroup429], (instrs VMOVNTPSZ256mr)>;
4074 def SPRWriteResGroup430 : SchedWriteRes<[SPRPort04_09, SPRPort07_08]> {
4076 let NumMicroOps = 2;
4078 def : InstRW<[SPRWriteResGroup430], (instrs VMOVNTPSZmr)>;
4080 def SPRWriteResGroup431 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4081 let ReleaseAtCycles = [3, 1, 8];
4083 let NumMicroOps = 12;
4085 def : InstRW<[SPRWriteResGroup431, ReadAfterVecXLd], (instregex "^VP2INTERSECTDZ128rm(b?)$")>;
4086 def : InstRW<[SPRWriteResGroup431, ReadAfterVecYLd], (instregex "^VP2INTERSECTQZ256rm(b?)$")>;
4088 def SPRWriteResGroup432 : SchedWriteRes<[SPRPort00_01_05, SPRPort05]> {
4089 let ReleaseAtCycles = [4, 8];
4091 let NumMicroOps = 12;
4093 def : InstRW<[SPRWriteResGroup432], (instrs VP2INTERSECTDZ128rr,
4094 VP2INTERSECTQZ256rr)>;
4096 def SPRWriteResGroup433 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort02_03_11, SPRPort05]> {
4097 let ReleaseAtCycles = [1, 8, 7, 2, 1, 11];
4099 let NumMicroOps = 30;
4101 def : InstRW<[SPRWriteResGroup433, ReadAfterVecYLd], (instregex "^VP2INTERSECTDZ256rm(b?)$")>;
4103 def SPRWriteResGroup434 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05, SPRPort01_05, SPRPort05]> {
4104 let ReleaseAtCycles = [1, 8, 8, 2, 11];
4106 let NumMicroOps = 30;
4108 def : InstRW<[SPRWriteResGroup434], (instrs VP2INTERSECTDZ256rr)>;
4110 def SPRWriteResGroup435 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4111 let ReleaseAtCycles = [13, 9, 1, 23];
4113 let NumMicroOps = 46;
4115 def : InstRW<[SPRWriteResGroup435, ReadAfterVecYLd], (instregex "^VP2INTERSECTDZrm(b?)$")>;
4117 def SPRWriteResGroup436 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
4118 let ReleaseAtCycles = [13, 10, 23];
4120 let NumMicroOps = 46;
4122 def : InstRW<[SPRWriteResGroup436], (instrs VP2INTERSECTDZrr)>;
4124 def SPRWriteResGroup437 : SchedWriteRes<[SPRPort02_03_11, SPRPort05]> {
4125 let ReleaseAtCycles = [1, 4];
4127 let NumMicroOps = 5;
4129 def : InstRW<[SPRWriteResGroup437, ReadAfterVecXLd], (instregex "^VP2INTERSECTQZ128rm(b?)$")>;
4131 def SPRWriteResGroup438 : SchedWriteRes<[SPRPort05]> {
4132 let ReleaseAtCycles = [4];
4134 let NumMicroOps = 4;
4136 def : InstRW<[SPRWriteResGroup438], (instrs VP2INTERSECTQZ128rr)>;
4138 def SPRWriteResGroup439 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4139 let ReleaseAtCycles = [8, 7, 1, 14];
4141 let NumMicroOps = 30;
4143 def : InstRW<[SPRWriteResGroup439, ReadAfterVecYLd], (instregex "^VP2INTERSECTQZrm(b?)$")>;
4145 def SPRWriteResGroup440 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
4146 let ReleaseAtCycles = [8, 8, 14];
4148 let NumMicroOps = 30;
4150 def : InstRW<[SPRWriteResGroup440], (instrs VP2INTERSECTQZrr)>;
4152 def SPRWriteResGroup441 : SchedWriteRes<[SPRPort00_01]> {
4155 def : InstRW<[SPRWriteResGroup441], (instregex "^VP(A|SU)BS(B|W)Z(128|256)rrk(z?)$",
4156 "^VPADD(U?)S(B|W)Z(128|256)rrk(z?)$",
4157 "^VPAVG(B|W)Z(128|256)rrk(z?)$",
4158 "^VPM(AX|IN)(SB|UW)Z(128|256)rrk(z?)$",
4159 "^VPM(AX|IN)(SW|UB)Z(128|256)rrk(z?)$",
4160 "^VPSH(L|R)DVWZ(128|256)rk(z?)$",
4161 "^VPS(L|R)LVWZ(128|256)rrk(z?)$",
4162 "^VPS(L|R)LWZ(128|256)rik(z?)$",
4163 "^VPSRAVWZ(128|256)rrk(z?)$",
4164 "^VPSRAWZ(128|256)rik(z?)$",
4165 "^VPSUBUS(B|W)Z(128|256)rrk(z?)$")>;
4167 def SPRWriteResGroup442 : SchedWriteRes<[SPRPort01_05, SPRPort02_03_11]> {
4169 let NumMicroOps = 2;
4171 def : InstRW<[SPRWriteResGroup442, ReadAfterVecYLd], (instregex "^VSHUFP(D|S)Yrmi$",
4172 "^VSHUFP(D|S)Z256rm(bi|ik)$",
4173 "^VSHUFP(D|S)Z256rmbik(z?)$",
4174 "^VSHUFP(D|S)Z256rmi((kz)?)$")>;
4175 def : InstRW<[SPRWriteResGroup442, ReadAfterVecYLd], (instrs VPBLENDWYrmi)>;
4177 def SPRWriteResGroup443 : SchedWriteRes<[SPRPort00, SPRPort05]> {
4179 let NumMicroOps = 2;
4181 def : InstRW<[SPRWriteResGroup443], (instregex "^VPBROADCASTM(B2Q|W2D)Z(128|256)rr$",
4182 "^VPBROADCASTM(B2Q|W2D)Zrr$",
4183 "^VP(ERM|SRA)WZrrk(z?)$",
4184 "^VPSHUFBITQMBZ(128|256)rr$",
4185 "^VPS(L|R)LWZrrk(z?)$")>;
4186 def : InstRW<[SPRWriteResGroup443], (instrs VPSHUFBITQMBZrr)>;
4188 def SPRWriteResGroup444 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4189 let ReleaseAtCycles = [1, 1, 1, 2, 1];
4191 let NumMicroOps = 6;
4193 def : InstRW<[SPRWriteResGroup444], (instregex "^VPCOMPRESS(B|W)Z(128|256)mr$")>;
4194 def : InstRW<[SPRWriteResGroup444], (instrs VPCOMPRESSWZmr)>;
4196 def SPRWriteResGroup445 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4197 let ReleaseAtCycles = [1, 1, 1, 2, 1];
4199 let NumMicroOps = 6;
4201 def : InstRW<[SPRWriteResGroup445], (instregex "^VPCOMPRESS(B|W)Z(128|256)mrk$")>;
4202 def : InstRW<[SPRWriteResGroup445], (instrs VPCOMPRESSWZmrk)>;
4204 def SPRWriteResGroup446 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4205 let ReleaseAtCycles = [1, 1, 2, 2, 2];
4207 let NumMicroOps = 8;
4209 def : InstRW<[SPRWriteResGroup446], (instrs VPCOMPRESSBZmr)>;
4211 def SPRWriteResGroup447 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4212 let ReleaseAtCycles = [1, 1, 2, 2, 2];
4214 let NumMicroOps = 8;
4216 def : InstRW<[SPRWriteResGroup447], (instrs VPCOMPRESSBZmrk)>;
4218 def SPRWriteResGroup448 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4219 let ReleaseAtCycles = [5, 4, 1, 5];
4221 let NumMicroOps = 15;
4223 def : InstRW<[SPRWriteResGroup448], (instregex "^VPCONFLICTDZ128rm((b|k|bk|kz)?)$")>;
4224 def : InstRW<[SPRWriteResGroup448], (instrs VPCONFLICTDZ128rmbkz)>;
4226 def SPRWriteResGroup449 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
4227 let ReleaseAtCycles = [5, 5, 5];
4229 let NumMicroOps = 15;
4231 def : InstRW<[SPRWriteResGroup449], (instregex "^VPCONFLICTDZ128rr((k|kz)?)$")>;
4233 def SPRWriteResGroup450 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
4234 let ReleaseAtCycles = [7, 5, 1, 1, 9];
4236 let NumMicroOps = 23;
4238 def : InstRW<[SPRWriteResGroup450], (instregex "^VPCONFLICTDZ256rm((b|k|bk|kz)?)$")>;
4239 def : InstRW<[SPRWriteResGroup450], (instrs VPCONFLICTDZ256rmbkz)>;
4241 def SPRWriteResGroup451 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort00_06, SPRPort05]> {
4242 let ReleaseAtCycles = [7, 6, 1, 9];
4244 let NumMicroOps = 23;
4246 def : InstRW<[SPRWriteResGroup451], (instregex "^VPCONFLICTDZ256rr((k|kz)?)$")>;
4248 def SPRWriteResGroup452 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4249 let ReleaseAtCycles = [11, 8, 1, 17];
4251 let NumMicroOps = 37;
4253 def : InstRW<[SPRWriteResGroup452], (instregex "^VPCONFLICTDZrm((b|k|bk|kz)?)$")>;
4254 def : InstRW<[SPRWriteResGroup452], (instrs VPCONFLICTDZrmbkz)>;
4256 def SPRWriteResGroup453 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
4257 let ReleaseAtCycles = [11, 9, 17];
4259 let NumMicroOps = 37;
4261 def : InstRW<[SPRWriteResGroup453], (instregex "^VPCONFLICTDZrr((kz)?)$")>;
4263 def SPRWriteResGroup454 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
4264 let ReleaseAtCycles = [11, 9, 17];
4266 let NumMicroOps = 37;
4268 def : InstRW<[SPRWriteResGroup454], (instrs VPCONFLICTDZrrk)>;
4270 def SPRWriteResGroup455 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4271 let ReleaseAtCycles = [1, 1, 2];
4273 let NumMicroOps = 4;
4275 def : InstRW<[SPRWriteResGroup455], (instregex "^VPCONFLICTQZ128rm((b|k|bk|kz)?)$")>;
4276 def : InstRW<[SPRWriteResGroup455], (instrs VPCONFLICTQZ128rmbkz)>;
4277 def : InstRW<[SPRWriteResGroup455, ReadAfterVecYLd], (instregex "^VPERM(I|T)2BZ128rm$")>;
4279 def SPRWriteResGroup456 : SchedWriteRes<[SPRPort00_01_05, SPRPort05]> {
4280 let ReleaseAtCycles = [1, 2];
4282 let NumMicroOps = 3;
4284 def : InstRW<[SPRWriteResGroup456], (instregex "^VPCONFLICTQZ128rr((k|kz)?)$")>;
4286 def SPRWriteResGroup457 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4287 let ReleaseAtCycles = [5, 4, 1, 5];
4289 let NumMicroOps = 15;
4291 def : InstRW<[SPRWriteResGroup457], (instregex "^VPCONFLICTQZ256rm((b|k|bk|kz)?)$")>;
4292 def : InstRW<[SPRWriteResGroup457], (instrs VPCONFLICTQZ256rmbkz)>;
4294 def SPRWriteResGroup458 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort05]> {
4295 let ReleaseAtCycles = [5, 5, 5];
4297 let NumMicroOps = 15;
4299 def : InstRW<[SPRWriteResGroup458], (instregex "^VPCONFLICTQZ256rr((k|kz)?)$")>;
4301 def SPRWriteResGroup459 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4302 let ReleaseAtCycles = [7, 5, 1, 9];
4304 let NumMicroOps = 22;
4306 def : InstRW<[SPRWriteResGroup459], (instregex "^VPCONFLICTQZrm((b|k|bk|kz)?)$")>;
4307 def : InstRW<[SPRWriteResGroup459], (instrs VPCONFLICTQZrmbkz)>;
4309 def SPRWriteResGroup460 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
4310 let ReleaseAtCycles = [7, 6, 9];
4312 let NumMicroOps = 22;
4314 def : InstRW<[SPRWriteResGroup460], (instregex "^VPCONFLICTQZrr((kz)?)$")>;
4316 def SPRWriteResGroup461 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort05]> {
4317 let ReleaseAtCycles = [7, 6, 9];
4319 let NumMicroOps = 22;
4321 def : InstRW<[SPRWriteResGroup461], (instrs VPCONFLICTQZrrk)>;
4323 def SPRWriteResGroup462 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4324 let ReleaseAtCycles = [1, 1, 2];
4326 let NumMicroOps = 4;
4328 def : InstRW<[SPRWriteResGroup462, ReadAfterVecYLd], (instregex "^VPERM(I|T)2BZ128rmk(z?)$")>;
4329 def : InstRW<[SPRWriteResGroup462, ReadAfterVecYLd], (instrs VPERMT2WZ128rm)>;
4331 def SPRWriteResGroup463 : SchedWriteRes<[SPRPort00_01_05, SPRPort05]> {
4332 let ReleaseAtCycles = [1, 2];
4334 let NumMicroOps = 3;
4336 def : InstRW<[SPRWriteResGroup463], (instregex "^VPERM(I|T)2BZ(128|256)rr$")>;
4338 def SPRWriteResGroup464 : SchedWriteRes<[SPRPort00_01_05, SPRPort05]> {
4339 let ReleaseAtCycles = [1, 2];
4341 let NumMicroOps = 3;
4343 def : InstRW<[SPRWriteResGroup464], (instregex "^VPERM(I|T)2BZ(128|256)rrk(z?)$",
4344 "^VPERM(I|T)2WZ(128|256)rr$")>;
4346 def SPRWriteResGroup465 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4347 let ReleaseAtCycles = [1, 1, 2];
4349 let NumMicroOps = 4;
4351 def : InstRW<[SPRWriteResGroup465, ReadAfterVecYLd], (instregex "^VPERM(I|T)2BZ256rm$")>;
4353 def SPRWriteResGroup466 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4354 let ReleaseAtCycles = [1, 1, 2];
4356 let NumMicroOps = 4;
4358 def : InstRW<[SPRWriteResGroup466, ReadAfterVecYLd], (instregex "^VPERM(I|T)2BZ256rmk(z?)$")>;
4359 def : InstRW<[SPRWriteResGroup466, ReadAfterVecYLd], (instrs VPERMI2WZ128rm,
4362 def SPRWriteResGroup467 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4363 let ReleaseAtCycles = [1, 1, 2];
4365 let NumMicroOps = 4;
4367 def : InstRW<[SPRWriteResGroup467, ReadAfterVecYLd], (instregex "^VPERM(I|T)2BZrm$")>;
4369 def SPRWriteResGroup468 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4370 let ReleaseAtCycles = [1, 1, 2];
4372 let NumMicroOps = 4;
4374 def : InstRW<[SPRWriteResGroup468, ReadAfterVecYLd], (instregex "^VPERM(I|T)2BZrmk(z?)$")>;
4375 def : InstRW<[SPRWriteResGroup468, ReadAfterVecYLd], (instrs VPERMT2WZrm)>;
4377 def SPRWriteResGroup469 : SchedWriteRes<[SPRPort00_05, SPRPort05]> {
4378 let ReleaseAtCycles = [1, 2];
4380 let NumMicroOps = 3;
4382 def : InstRW<[SPRWriteResGroup469], (instregex "^VPERM(I|T)2BZrr$")>;
4384 def SPRWriteResGroup470 : SchedWriteRes<[SPRPort00_05, SPRPort05]> {
4385 let ReleaseAtCycles = [1, 2];
4387 let NumMicroOps = 3;
4389 def : InstRW<[SPRWriteResGroup470], (instregex "^VPERM(I|T)2BZrrk(z?)$",
4390 "^VPERM(I|T)2WZrr$")>;
4392 def SPRWriteResGroup471 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4393 let ReleaseAtCycles = [1, 1, 2];
4395 let NumMicroOps = 4;
4397 def : InstRW<[SPRWriteResGroup471, ReadAfterVecYLd], (instregex "^VPERMI2WZ128rmk(z?)$",
4398 "^VPERMT2WZ256rmk(z?)$")>;
4400 def SPRWriteResGroup472 : SchedWriteRes<[SPRPort00_01_05, SPRPort05]> {
4401 let ReleaseAtCycles = [1, 2];
4403 let NumMicroOps = 3;
4405 def : InstRW<[SPRWriteResGroup472], (instregex "^VPERM(I|T)2WZ(128|256)rrk(z?)$")>;
4407 def SPRWriteResGroup473 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4408 let ReleaseAtCycles = [1, 1, 2];
4410 let NumMicroOps = 4;
4412 def : InstRW<[SPRWriteResGroup473, ReadAfterVecYLd], (instregex "^VPERMT2WZ128rmk(z?)$")>;
4413 def : InstRW<[SPRWriteResGroup473, ReadAfterVecYLd], (instrs VPERMI2WZ256rm)>;
4415 def SPRWriteResGroup474 : SchedWriteRes<[SPRPort00_01_05, SPRPort02_03_11, SPRPort05]> {
4416 let ReleaseAtCycles = [1, 1, 2];
4418 let NumMicroOps = 4;
4420 def : InstRW<[SPRWriteResGroup474, ReadAfterVecYLd], (instregex "^VPERMI2WZ256rmk(z?)$")>;
4422 def SPRWriteResGroup475 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4423 let ReleaseAtCycles = [1, 1, 2];
4425 let NumMicroOps = 4;
4427 def : InstRW<[SPRWriteResGroup475, ReadAfterVecYLd], (instrs VPERMI2WZrm)>;
4429 def SPRWriteResGroup476 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4430 let ReleaseAtCycles = [1, 1, 2];
4432 let NumMicroOps = 4;
4434 def : InstRW<[SPRWriteResGroup476, ReadAfterVecYLd], (instregex "^VPERMI2WZrmk(z?)$")>;
4436 def SPRWriteResGroup477 : SchedWriteRes<[SPRPort00_05, SPRPort05]> {
4437 let ReleaseAtCycles = [1, 2];
4439 let NumMicroOps = 3;
4441 def : InstRW<[SPRWriteResGroup477], (instregex "^VPERM(I|T)2WZrrk(z?)$")>;
4443 def SPRWriteResGroup478 : SchedWriteRes<[SPRPort00_05, SPRPort02_03_11, SPRPort05]> {
4444 let ReleaseAtCycles = [1, 1, 2];
4446 let NumMicroOps = 4;
4448 def : InstRW<[SPRWriteResGroup478, ReadAfterVecYLd], (instregex "^VPERMT2WZrmk(z?)$")>;
4450 def SPRWriteResGroup479 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
4452 let NumMicroOps = 3;
4454 def : InstRW<[SPRWriteResGroup479, ReadAfterVecYLd], (instrs VPERMWZ128rm)>;
4456 def SPRWriteResGroup480 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
4458 let NumMicroOps = 3;
4460 def : InstRW<[SPRWriteResGroup480, ReadAfterVecYLd], (instregex "^VPERMWZ(128|256)rmk(z?)$")>;
4462 def SPRWriteResGroup481 : SchedWriteRes<[SPRPort00_01, SPRPort05]> {
4464 let NumMicroOps = 2;
4466 def : InstRW<[SPRWriteResGroup481], (instregex "^VPERMWZ(128|256)rr$")>;
4468 def SPRWriteResGroup482 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11, SPRPort05]> {
4470 let NumMicroOps = 3;
4472 def : InstRW<[SPRWriteResGroup482, ReadAfterVecYLd], (instrs VPERMWZ256rm)>;
4474 def SPRWriteResGroup483 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
4476 let NumMicroOps = 3;
4478 def : InstRW<[SPRWriteResGroup483, ReadAfterVecYLd], (instrs VPERMWZrm)>;
4480 def SPRWriteResGroup484 : SchedWriteRes<[SPRPort05]> {
4481 let ReleaseAtCycles = [2];
4483 let NumMicroOps = 2;
4485 def : InstRW<[SPRWriteResGroup484], (instregex "^VPEXPAND(B|W)Z(128|256)rrk(z?)$",
4486 "^VPEXPAND(B|W)Zrrk(z?)$")>;
4488 def SPRWriteResGroup485 : SchedWriteRes<[SPRPort00_01, SPRPort01_05, SPRPort02_03_11]> {
4489 let ReleaseAtCycles = [1, 2, 1];
4491 let NumMicroOps = 4;
4493 def : InstRW<[SPRWriteResGroup485, ReadAfterVecYLd], (instregex "^VPH(ADD|SUB)SWYrm$")>;
4495 def SPRWriteResGroup486 : SchedWriteRes<[SPRPort00_01]> {
4498 def : InstRW<[SPRWriteResGroup486], (instregex "^VPMADDUBSWZ(128|256)rrk(z?)$",
4499 "^VPMULH((U|RS)?)WZ(128|256)rrk(z?)$",
4500 "^VPMULLWZ(128|256)rrk(z?)$")>;
4502 def SPRWriteResGroup487 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4504 let NumMicroOps = 2;
4506 def : InstRW<[SPRWriteResGroup487, ReadAfterVecYLd], (instregex "^VPMADDUBSWZrmk(z?)$",
4507 "^VPMULH((U|RS)?)WZrmk(z?)$",
4508 "^VPMULLWZrmk(z?)$")>;
4510 def SPRWriteResGroup488 : SchedWriteRes<[SPRPort00]> {
4513 def : InstRW<[SPRWriteResGroup488], (instregex "^VPMADDUBSWZrrk(z?)$",
4514 "^VPMULH((U|RS)?)WZrrk(z?)$",
4515 "^VPMULLWZrrk(z?)$")>;
4517 def SPRWriteResGroup489 : SchedWriteRes<[SPRPort01_05, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4519 let NumMicroOps = 4;
4521 def : InstRW<[SPRWriteResGroup489], (instregex "^VPMOV((US)?)DBZ(128|256)mr$",
4522 "^VPMOV((S|US)?)(D|Q)WZ(128|256)mr$",
4523 "^VPMOV(Q|W|SD|SW)BZ256mr$",
4524 "^VPMOV(W|SD)BZ128mr$",
4525 "^VPMOV(U?)SQBZ256mr$",
4526 "^VPMOV(U?)SQDZ(128|256)mr$",
4527 "^VPMOV(U?)SWBZ128mr$")>;
4528 def : InstRW<[SPRWriteResGroup489], (instrs VPMOVUSWBZ256mr)>;
4530 def SPRWriteResGroup490 : SchedWriteRes<[SPRPort01_05, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4532 let NumMicroOps = 4;
4534 def : InstRW<[SPRWriteResGroup490], (instregex "^VPMOV(D|Q|W|SQ|SW)BZ128mrk$",
4535 "^VPMOV((S|US)?)(D|Q)WZ128mrk$",
4536 "^VPMOV(U?)S(DB|QD)Z128mrk$",
4537 "^VPMOVUS(Q|W)BZ128mrk$")>;
4539 def SPRWriteResGroup491 : SchedWriteRes<[SPRPort01_05, SPRPort05]> {
4541 let NumMicroOps = 2;
4543 def : InstRW<[SPRWriteResGroup491], (instregex "^VPMOV(D|Q|W|SQ|SW)BZ128rr$",
4544 "^VPMOV((S|US)?)(D|Q)WZ128rr$",
4545 "^VPMOV(U?)S(DB|QD)Z128rr$",
4546 "^VPMOV(U?)SQDZ128rrk(z?)$",
4547 "^VPMOVUS(Q|W)BZ128rr$")>;
4549 def SPRWriteResGroup492 : SchedWriteRes<[SPRPort01_05, SPRPort05]> {
4551 let NumMicroOps = 2;
4553 def : InstRW<[SPRWriteResGroup492], (instregex "^VPMOV(D|Q|W|SQ|SW)BZ128rrk(z?)$",
4554 "^VPMOV(D|Q|W|SQ|SW)BZ256rr$",
4555 "^VPMOV((S|US)?)(D|Q)WZ128rrk(z?)$",
4556 "^VPMOV((S|US)?)(D|Q)WZ256rr$",
4557 "^VPMOV(U?)SDBZ128rrk(z?)$",
4558 "^VPMOV(U?)S(DB|QD)Z256rr$",
4559 "^VPMOV(U?)SQDZ256rrk(z?)$",
4560 "^VPMOVUS(Q|W)BZ128rrk(z?)$",
4561 "^VPMOVUS(Q|W)BZ256rr$")>;
4563 def SPRWriteResGroup493 : SchedWriteRes<[SPRPort01_05, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4565 let NumMicroOps = 4;
4567 def : InstRW<[SPRWriteResGroup493], (instregex "^VPMOV(D|Q|W|SQ|SW)BZ256mrk$",
4568 "^VPMOV((S|US)?)(D|Q)WZ256mrk$",
4569 "^VPMOV(U?)S(DB|QD)Z256mrk$",
4570 "^VPMOVUS(Q|W)BZ256mrk$")>;
4572 def SPRWriteResGroup494 : SchedWriteRes<[SPRPort01_05, SPRPort05]> {
4574 let NumMicroOps = 2;
4576 def : InstRW<[SPRWriteResGroup494], (instregex "^VPMOV(D|Q|W|SQ|SW)BZ256rrk(z?)$",
4577 "^VPMOV((S|US)?)(D|Q)WZ256rrk(z?)$",
4578 "^VPMOV(U?)SDBZ256rrk(z?)$",
4579 "^VPMOVUS(Q|W)BZ256rrk(z?)$")>;
4581 def SPRWriteResGroup495 : SchedWriteRes<[SPRPort01_05, SPRPort04_09, SPRPort05, SPRPort07_08]> {
4583 let NumMicroOps = 4;
4585 def : InstRW<[SPRWriteResGroup495], (instregex "^VPMOV((S|US)?)QBZ128mr$")>;
4587 def SPRWriteResGroup496 : SchedWriteRes<[SPRPort04_09, SPRPort05, SPRPort07_08]> {
4589 let NumMicroOps = 3;
4591 def : InstRW<[SPRWriteResGroup496], (instregex "^VPMOVQDZ((256)?)mrk$")>;
4593 def SPRWriteResGroup497 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
4594 let ReleaseAtCycles = [3, 1];
4596 let NumMicroOps = 4;
4598 def : InstRW<[SPRWriteResGroup497, ReadAfterVecXLd], (instregex "^VPMULLQZ128rm((b|k|bk|kz)?)$")>;
4599 def : InstRW<[SPRWriteResGroup497, ReadAfterVecXLd], (instrs VPMULLQZ128rmbkz)>;
4600 def : InstRW<[SPRWriteResGroup497, ReadAfterVecYLd], (instregex "^VPMULLQZ256rm((b|k|bk|kz)?)$")>;
4601 def : InstRW<[SPRWriteResGroup497, ReadAfterVecYLd], (instrs VPMULLQZ256rmbkz)>;
4603 def SPRWriteResGroup498 : SchedWriteRes<[SPRPort00_01]> {
4604 let ReleaseAtCycles = [3];
4606 let NumMicroOps = 3;
4608 def : InstRW<[SPRWriteResGroup498], (instregex "^VPMULLQZ(128|256)rr((k|kz)?)$")>;
4610 def SPRWriteResGroup499 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4611 let ReleaseAtCycles = [3, 1];
4613 let NumMicroOps = 4;
4615 def : InstRW<[SPRWriteResGroup499, ReadAfterVecYLd], (instregex "^VPMULLQZrm((b|k|bk|kz)?)$")>;
4616 def : InstRW<[SPRWriteResGroup499, ReadAfterVecYLd], (instrs VPMULLQZrmbkz)>;
4618 def SPRWriteResGroup500 : SchedWriteRes<[SPRPort00]> {
4619 let ReleaseAtCycles = [3];
4621 let NumMicroOps = 3;
4623 def : InstRW<[SPRWriteResGroup500], (instregex "^VPMULLQZrr((k|kz)?)$")>;
4625 def SPRWriteResGroup501 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
4626 let ReleaseAtCycles = [1, 1, 1, 4, 4];
4628 let NumMicroOps = 11;
4630 def : InstRW<[SPRWriteResGroup501], (instregex "^VPSCATTER(D|Q)QZ256mr$",
4631 "^VSCATTER(D|Q)PDZ256mr$")>;
4632 def : InstRW<[SPRWriteResGroup501], (instrs VPSCATTERDDZ128mr,
4635 VSCATTERQPSZ256mr)>;
4637 def SPRWriteResGroup502 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
4638 let ReleaseAtCycles = [1, 1, 1, 8, 8];
4640 let NumMicroOps = 19;
4642 def : InstRW<[SPRWriteResGroup502], (instrs VPSCATTERDDZ256mr,
4643 VSCATTERDPSZ256mr)>;
4645 def SPRWriteResGroup503 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
4646 let ReleaseAtCycles = [2, 1, 16, 16];
4648 let NumMicroOps = 35;
4650 def : InstRW<[SPRWriteResGroup503], (instrs VPSCATTERDDZmr,
4653 def SPRWriteResGroup504 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
4654 let ReleaseAtCycles = [1, 1, 1, 2, 2];
4656 let NumMicroOps = 7;
4658 def : InstRW<[SPRWriteResGroup504], (instregex "^VPSCATTER(D|Q)QZ128mr$",
4659 "^VSCATTER(D|Q)PDZ128mr$")>;
4660 def : InstRW<[SPRWriteResGroup504], (instrs VPSCATTERQDZ128mr,
4661 VSCATTERQPSZ128mr)>;
4663 def SPRWriteResGroup505 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06_10, SPRPort04_09, SPRPort07_08]> {
4664 let ReleaseAtCycles = [2, 1, 8, 8];
4666 let NumMicroOps = 19;
4668 def : InstRW<[SPRWriteResGroup505], (instregex "^VPSCATTER(D|Q)QZmr$",
4669 "^VSCATTER(D|Q)PDZmr$")>;
4670 def : InstRW<[SPRWriteResGroup505], (instrs VPSCATTERQDZmr,
4673 def SPRWriteResGroup506 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
4675 let NumMicroOps = 2;
4677 def : InstRW<[SPRWriteResGroup506, ReadAfterVecXLd], (instregex "^VPSH(L|R)D(D|Q)Z128rmbi$",
4678 "^VPSH(L|R)D(D|Q|W)Z128rmi$",
4679 "^VPSH(L|R)DV(D|Q|W)Z128m$",
4680 "^VPSH(L|R)DV(D|Q)Z128m(b|k|kz)$",
4681 "^VPSH(L|R)DV(D|Q)Z128mbk(z?)$")>;
4683 def SPRWriteResGroup507 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11]> {
4685 let NumMicroOps = 3;
4687 def : InstRW<[SPRWriteResGroup507, ReadAfterVecXLd], (instregex "^VPSH(L|R)D(D|Q)Z128rm(b?)ik(z?)$")>;
4689 def SPRWriteResGroup508 : SchedWriteRes<[SPRPort00_01]>;
4690 def : InstRW<[SPRWriteResGroup508], (instregex "^VPSH(L|R)D(D|Q|W)Z(128|256)rri$",
4691 "^VPSH(L|R)DV(D|Q|W)Z(128|256)r$",
4692 "^VPSH(L|R)DV(D|Q)Z(128|256)rk(z?)$")>;
4694 def SPRWriteResGroup509 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05]> {
4696 let NumMicroOps = 2;
4698 def : InstRW<[SPRWriteResGroup509], (instregex "^VPSH(L|R)D(D|Q)Z(128|256)rrik(z?)$")>;
4700 def SPRWriteResGroup510 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
4702 let NumMicroOps = 2;
4704 def : InstRW<[SPRWriteResGroup510, ReadAfterVecYLd], (instregex "^VPSH(L|R)D(D|Q)Z256rmbi$",
4705 "^VPSH(L|R)D(D|Q|W)Z256rmi$",
4706 "^VPSH(L|R)DV(D|Q|W)Z256m$",
4707 "^VPSH(L|R)DV(D|Q)Z256m(b|k|kz)$",
4708 "^VPSH(L|R)DV(D|Q)Z256mbk(z?)$")>;
4710 def SPRWriteResGroup511 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11]> {
4712 let NumMicroOps = 3;
4714 def : InstRW<[SPRWriteResGroup511, ReadAfterVecYLd], (instregex "^VPSH(L|R)D(D|Q)Z256rm(b?)ik(z?)$")>;
4716 def SPRWriteResGroup512 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4718 let NumMicroOps = 2;
4720 def : InstRW<[SPRWriteResGroup512, ReadAfterVecYLd], (instregex "^VPSH(L|R)D(D|Q)Zrmbi$",
4721 "^VPSH(L|R)D(D|Q|W)Zrmi$",
4722 "^VPSH(L|R)DV(D|Q|W)Zm$",
4723 "^VPSH(L|R)DV(D|Q)Zm(b|k|kz)$",
4724 "^VPSH(L|R)DV(D|Q)Zmbk(z?)$")>;
4726 def SPRWriteResGroup513 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11]> {
4728 let NumMicroOps = 3;
4730 def : InstRW<[SPRWriteResGroup513, ReadAfterVecYLd], (instregex "^VPSH(L|R)D(D|Q)Zrm(b?)ik(z?)$")>;
4732 def SPRWriteResGroup514 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
4734 let NumMicroOps = 2;
4736 def : InstRW<[SPRWriteResGroup514], (instregex "^VPSH(L|R)D(D|Q)Zrrik(z?)$")>;
4738 def SPRWriteResGroup515 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11]> {
4740 let NumMicroOps = 3;
4742 def : InstRW<[SPRWriteResGroup515, ReadAfterVecXLd], (instregex "^VPSH(L|R)DWZ128rmik(z?)$")>;
4744 def SPRWriteResGroup516 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05]> {
4746 let NumMicroOps = 2;
4748 def : InstRW<[SPRWriteResGroup516], (instregex "^VPSH(L|R)DWZ(128|256)rrik(z?)$")>;
4750 def SPRWriteResGroup517 : SchedWriteRes<[SPRPort00_01, SPRPort00_01_05, SPRPort02_03_11]> {
4752 let NumMicroOps = 3;
4754 def : InstRW<[SPRWriteResGroup517, ReadAfterVecYLd], (instregex "^VPSH(L|R)DWZ256rmik(z?)$")>;
4756 def SPRWriteResGroup518 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11]> {
4758 let NumMicroOps = 3;
4760 def : InstRW<[SPRWriteResGroup518, ReadAfterVecYLd], (instregex "^VPSH(L|R)DWZrmik(z?)$")>;
4762 def SPRWriteResGroup519 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
4764 let NumMicroOps = 2;
4766 def : InstRW<[SPRWriteResGroup519], (instregex "^VPSH(L|R)DWZrrik(z?)$")>;
4768 def SPRWriteResGroup520 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
4770 let NumMicroOps = 3;
4772 def : InstRW<[SPRWriteResGroup520, ReadAfterVecXLd], (instrs VPSHUFBITQMBZ128rm)>;
4773 def : InstRW<[SPRWriteResGroup520, ReadAfterVecYLd], (instregex "^VPSHUFBITQMBZ((256)?)rm$")>;
4775 def SPRWriteResGroup521 : SchedWriteRes<[SPRPort00, SPRPort02_03_11, SPRPort05]> {
4777 let NumMicroOps = 3;
4779 def : InstRW<[SPRWriteResGroup521, ReadAfterVecXLd], (instrs VPSHUFBITQMBZ128rmk)>;
4780 def : InstRW<[SPRWriteResGroup521, ReadAfterVecYLd], (instregex "^VPSHUFBITQMBZ((256)?)rmk$")>;
4782 def SPRWriteResGroup522 : SchedWriteRes<[SPRPort00_01, SPRPort01_05]> {
4784 let NumMicroOps = 2;
4786 def : InstRW<[SPRWriteResGroup522], (instregex "^VPS(L|R)LWZ128rrk(z?)$",
4787 "^VPSRAWZ128rrk(z?)$")>;
4789 def SPRWriteResGroup523 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11]> {
4790 let ReleaseAtCycles = [2, 1, 1];
4792 let NumMicroOps = 4;
4794 def : InstRW<[SPRWriteResGroup523, ReadAfterVecYLd], (instregex "^VR(CP|SQRT)PHZm(bk|kz)$",
4795 "^VR(CP|SQRT)PHZm(k|bkz)$")>;
4797 def SPRWriteResGroup524 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
4798 let ReleaseAtCycles = [2, 1];
4800 let NumMicroOps = 3;
4802 def : InstRW<[SPRWriteResGroup524], (instregex "^VRCPPHZrk(z?)$")>;
4804 def SPRWriteResGroup525 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
4805 let ReleaseAtCycles = [3, 1];
4807 let NumMicroOps = 4;
4809 def : InstRW<[SPRWriteResGroup525, ReadAfterVecXLd], (instregex "^VREDUCEPHZ128rm(b?)i$")>;
4810 def : InstRW<[SPRWriteResGroup525, ReadAfterVecXLd], (instrs VREDUCESHZrmi)>;
4811 def : InstRW<[SPRWriteResGroup525, ReadAfterVecYLd], (instregex "^VREDUCEPHZ256rm(b?)i$")>;
4813 def SPRWriteResGroup526 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
4814 let ReleaseAtCycles = [3, 1];
4816 let NumMicroOps = 4;
4818 def : InstRW<[SPRWriteResGroup526, ReadAfterVecXLd], (instregex "^VREDUCEPHZ128rm(b?)ik(z?)$",
4819 "^VREDUCESHZrmik(z?)$")>;
4820 def : InstRW<[SPRWriteResGroup526, ReadAfterVecYLd], (instregex "^VREDUCEPHZ256rm(b?)ik(z?)$")>;
4822 def SPRWriteResGroup527 : SchedWriteRes<[SPRPort00_01]> {
4823 let ReleaseAtCycles = [3];
4825 let NumMicroOps = 3;
4827 def : InstRW<[SPRWriteResGroup527], (instregex "^VREDUCEPHZ(128|256)rri$",
4828 "^VREDUCESHZrri(b?)$")>;
4830 def SPRWriteResGroup528 : SchedWriteRes<[SPRPort00_01]> {
4831 let ReleaseAtCycles = [3];
4833 let NumMicroOps = 3;
4835 def : InstRW<[SPRWriteResGroup528], (instregex "^VREDUCEPHZ(128|256)rrik(z?)$",
4836 "^VREDUCESHZrri(bk|kz)$",
4837 "^VREDUCESHZrri(k|bkz)$")>;
4839 def SPRWriteResGroup529 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4840 let ReleaseAtCycles = [3, 1];
4842 let NumMicroOps = 4;
4844 def : InstRW<[SPRWriteResGroup529, ReadAfterVecYLd], (instregex "^VREDUCEPHZrm(b?)i$")>;
4846 def SPRWriteResGroup530 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4847 let ReleaseAtCycles = [3, 1];
4849 let NumMicroOps = 4;
4851 def : InstRW<[SPRWriteResGroup530, ReadAfterVecYLd], (instregex "^VREDUCEPHZrm(b?)ik(z?)$")>;
4853 def SPRWriteResGroup531 : SchedWriteRes<[SPRPort00]> {
4854 let ReleaseAtCycles = [3];
4856 let NumMicroOps = 3;
4858 def : InstRW<[SPRWriteResGroup531], (instregex "^VREDUCEPHZrri(b?)$")>;
4860 def SPRWriteResGroup532 : SchedWriteRes<[SPRPort00]> {
4861 let ReleaseAtCycles = [3];
4863 let NumMicroOps = 3;
4865 def : InstRW<[SPRWriteResGroup532], (instregex "^VREDUCEPHZrri(bk|kz)$",
4866 "^VREDUCEPHZrri(k|bkz)$")>;
4868 def SPRWriteResGroup533 : SchedWriteRes<[SPRPort00]> {
4869 let ReleaseAtCycles = [2];
4871 let NumMicroOps = 2;
4873 def : InstRW<[SPRWriteResGroup533], (instregex "^VRNDSCALEP(D|S)Zrri((b|k|bk|kz)?)$",
4874 "^VRNDSCALEP(D|S)Zrribkz$")>;
4876 def SPRWriteResGroup534 : SchedWriteRes<[SPRPort00_01, SPRPort02_03_11]> {
4877 let ReleaseAtCycles = [2, 1];
4879 let NumMicroOps = 3;
4881 def : InstRW<[SPRWriteResGroup534, ReadAfterVecXLd], (instregex "^VRNDSCALEPHZ128rm(b?)ik(z?)$",
4882 "^VRNDSCALESHZm_Intk(z?)$",
4883 "^VSCALEFPHZ128rm(bk|kz)$",
4884 "^VSCALEFPHZ128rm(k|bkz)$")>;
4885 def : InstRW<[SPRWriteResGroup534, ReadAfterVecYLd], (instregex "^VRNDSCALEPHZ256rm(b?)ik(z?)$",
4886 "^VSCALEFPHZ256rm(bk|kz)$",
4887 "^VSCALEFPHZ256rm(k|bkz)$")>;
4888 def : InstRW<[SPRWriteResGroup534, ReadAfterVecLd], (instregex "^VSCALEFSHZrmk(z?)$")>;
4890 def SPRWriteResGroup535 : SchedWriteRes<[SPRPort00_01]> {
4891 let ReleaseAtCycles = [2];
4893 let NumMicroOps = 2;
4895 def : InstRW<[SPRWriteResGroup535], (instregex "^VRNDSCALEPHZ(128|256)rrik(z?)$",
4896 "^VRNDSCALESHZr(b?)_Intk(z?)$",
4897 "^VSCALEFPHZ(128|256)rrk(z?)$",
4898 "^VSCALEFSHZrrb_Intk(z?)$",
4899 "^VSCALEFSHZrrk(z?)$")>;
4901 def SPRWriteResGroup536 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4902 let ReleaseAtCycles = [2, 1];
4904 let NumMicroOps = 3;
4906 def : InstRW<[SPRWriteResGroup536, ReadAfterVecYLd], (instregex "^VRNDSCALEPHZrm(b?)ik(z?)$",
4907 "^VSCALEFPHZrm(bk|kz)$",
4908 "^VSCALEFPHZrm(k|bkz)$")>;
4910 def SPRWriteResGroup537 : SchedWriteRes<[SPRPort00]> {
4911 let ReleaseAtCycles = [2];
4913 let NumMicroOps = 2;
4915 def : InstRW<[SPRWriteResGroup537], (instregex "^VRNDSCALEPHZrri(bk|kz)$",
4916 "^VRNDSCALEPHZrri(k|bkz)$",
4917 "^VSCALEFPHZrr(bk|kz)$",
4918 "^VSCALEFPHZrr(k|bkz)$")>;
4920 def SPRWriteResGroup538 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
4921 let ReleaseAtCycles = [2, 1];
4923 let NumMicroOps = 3;
4925 def : InstRW<[SPRWriteResGroup538], (instregex "^VRSQRT14P(D|S)Zr$")>;
4926 def : InstRW<[SPRWriteResGroup538], (instrs VRSQRT14PSZrk,
4929 def SPRWriteResGroup539 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4931 let NumMicroOps = 2;
4933 def : InstRW<[SPRWriteResGroup539], (instrs VSQRTPDYm)>;
4934 def : InstRW<[SPRWriteResGroup539, ReadAfterVecYLd], (instregex "^VSQRTPDZ256m(b?)$")>;
4936 def SPRWriteResGroup540 : SchedWriteRes<[SPRPort00, SPRPort02_03_11]> {
4938 let NumMicroOps = 2;
4940 def : InstRW<[SPRWriteResGroup540, ReadAfterVecXLd], (instregex "^VSQRTPDZ128m(bk|kz)$",
4941 "^VSQRTPDZ128m(k|bkz)$")>;
4942 def : InstRW<[SPRWriteResGroup540, ReadAfterVecLd], (instregex "^VSQRTSDZm_Intk(z?)$")>;
4944 def SPRWriteResGroup541 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11]> {
4945 let ReleaseAtCycles = [2, 1, 1];
4947 let NumMicroOps = 4;
4949 def : InstRW<[SPRWriteResGroup541, ReadAfterVecYLd], (instrs VSQRTPDZm)>;
4951 def SPRWriteResGroup542 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort02_03_11]> {
4952 let ReleaseAtCycles = [2, 1, 1];
4954 let NumMicroOps = 4;
4956 def : InstRW<[SPRWriteResGroup542, ReadAfterVecYLd], (instrs VSQRTPDZmb)>;
4958 def SPRWriteResGroup543 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
4959 let ReleaseAtCycles = [2, 1];
4961 let NumMicroOps = 3;
4963 def : InstRW<[SPRWriteResGroup543], (instrs VSQRTPDZr)>;
4965 def SPRWriteResGroup544 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
4966 let ReleaseAtCycles = [2, 1, 1];
4968 let NumMicroOps = 4;
4970 def : InstRW<[SPRWriteResGroup544, ReadAfterVecXLd], (instregex "^VSQRTPHZ128m(bk|kz)$",
4971 "^VSQRTPHZ128m(k|bkz)$")>;
4973 def SPRWriteResGroup545 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
4974 let ReleaseAtCycles = [2, 1];
4976 let NumMicroOps = 3;
4978 def : InstRW<[SPRWriteResGroup545], (instregex "^VSQRTPHZ(128|256)rk$")>;
4979 def : InstRW<[SPRWriteResGroup545], (instrs VSQRTPHZ256rkz)>;
4981 def SPRWriteResGroup546 : SchedWriteRes<[SPRPort00, SPRPort00_01_05]> {
4982 let ReleaseAtCycles = [2, 1];
4984 let NumMicroOps = 3;
4986 def : InstRW<[SPRWriteResGroup546], (instrs VSQRTPHZ128rkz)>;
4988 def SPRWriteResGroup547 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
4989 let ReleaseAtCycles = [2, 1, 1];
4991 let NumMicroOps = 4;
4993 def : InstRW<[SPRWriteResGroup547, ReadAfterVecYLd], (instregex "^VSQRTPHZ256m(b?)$")>;
4995 def SPRWriteResGroup548 : SchedWriteRes<[SPRPort00, SPRPort00_01_05, SPRPort02_03_11]> {
4996 let ReleaseAtCycles = [2, 1, 1];
4998 let NumMicroOps = 4;
5000 def : InstRW<[SPRWriteResGroup548, ReadAfterVecYLd], (instregex "^VSQRTPHZ256m(bk|kz)$",
5001 "^VSQRTPHZ256m(k|bkz)$")>;
5003 def SPRWriteResGroup549 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
5004 let ReleaseAtCycles = [4, 2, 1, 1, 1];
5006 let NumMicroOps = 9;
5008 def : InstRW<[SPRWriteResGroup549, ReadAfterVecYLd], (instregex "^VSQRTPHZm(b?)$")>;
5010 def SPRWriteResGroup550 : SchedWriteRes<[SPRPort00, SPRPort00_05, SPRPort00_06, SPRPort02_03_11, SPRPort05]> {
5011 let ReleaseAtCycles = [4, 2, 1, 1, 1];
5013 let NumMicroOps = 9;
5015 def : InstRW<[SPRWriteResGroup550, ReadAfterVecYLd], (instregex "^VSQRTPHZm(bk|kz)$",
5016 "^VSQRTPHZm(k|bkz)$")>;
5018 def SPRWriteResGroup551 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort05]> {
5019 let ReleaseAtCycles = [4, 1, 1];
5021 let NumMicroOps = 6;
5023 def : InstRW<[SPRWriteResGroup551], (instregex "^VSQRTPHZr(b?)$")>;
5025 def SPRWriteResGroup552 : SchedWriteRes<[SPRPort00, SPRPort00_06, SPRPort05]> {
5026 let ReleaseAtCycles = [4, 1, 1];
5028 let NumMicroOps = 6;
5030 def : InstRW<[SPRWriteResGroup552], (instregex "^VSQRTPHZr(bk|kz)$",
5031 "^VSQRTPHZr(k|bkz)$")>;
5033 def SPRWriteResGroup553 : SchedWriteRes<[SPRPort00, SPRPort00_05]> {
5034 let ReleaseAtCycles = [2, 1];
5036 let NumMicroOps = 3;
5038 def : InstRW<[SPRWriteResGroup553], (instrs VSQRTPSZr)>;
5040 def SPRWriteResGroup554 : SchedWriteRes<[SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort01_05_10]> {
5041 let ReleaseAtCycles = [1, 2, 3, 3, 1];
5043 let NumMicroOps = 10;
5045 def : InstRW<[SPRWriteResGroup554], (instrs VZEROALL)>;
5047 def SPRWriteResGroup555 : SchedWriteRes<[SPRPort00_01_05_06]> {
5048 let ReleaseAtCycles = [2];
5050 let NumMicroOps = 2;
5052 def : InstRW<[SPRWriteResGroup555], (instrs WAIT)>;
5054 def SPRWriteResGroup556 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5055 let ReleaseAtCycles = [8, 6, 19, 63, 21, 15, 1, 10, 1];
5056 let Latency = SapphireRapidsModel.MaxLatency;
5057 let NumMicroOps = 144;
5059 def : InstRW<[SPRWriteResGroup556], (instrs WRMSR)>;
5061 def SPRWriteResGroup557 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06, SPRPort01, SPRPort05]> {
5062 let ReleaseAtCycles = [2, 1, 4, 1];
5063 let Latency = SapphireRapidsModel.MaxLatency;
5064 let NumMicroOps = 8;
5066 def : InstRW<[SPRWriteResGroup557], (instrs WRPKRUr)>;
5068 def SPRWriteResGroup558 : SchedWriteRes<[SPRPort00_01_05_06_10]> {
5069 let ReleaseAtCycles = [2];
5071 let NumMicroOps = 2;
5073 def : InstRW<[SPRWriteResGroup558, WriteRMW], (instregex "^XADD(16|32|64)rm$")>;
5075 def SPRWriteResGroup559 : SchedWriteRes<[SPRPort00_01_05_06_10]> {
5076 let ReleaseAtCycles = [2];
5078 let NumMicroOps = 2;
5080 def : InstRW<[SPRWriteResGroup559, WriteRMW], (instrs XADD8rm)>;
5082 def SPRWriteResGroup560 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
5083 let ReleaseAtCycles = [4, 1];
5085 let NumMicroOps = 5;
5087 def : InstRW<[SPRWriteResGroup560, WriteRMW], (instregex "^XCHG(16|32)rm$")>;
5089 def SPRWriteResGroup561 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
5090 let ReleaseAtCycles = [5, 1];
5092 let NumMicroOps = 6;
5094 def : InstRW<[SPRWriteResGroup561, WriteRMW], (instrs XCHG64rm)>;
5096 def SPRWriteResGroup562 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
5097 let ReleaseAtCycles = [4, 1];
5099 let NumMicroOps = 5;
5101 def : InstRW<[SPRWriteResGroup562, WriteRMW], (instrs XCHG8rm)>;
5103 def SPRWriteResGroup563 : SchedWriteRes<[SPRPort00, SPRPort00_01_05_06, SPRPort00_05, SPRPort01, SPRPort05, SPRPort06]> {
5104 let ReleaseAtCycles = [2, 4, 2, 1, 2, 4];
5106 let NumMicroOps = 15;
5108 def : InstRW<[SPRWriteResGroup563], (instrs XCH_F)>;
5110 def SPRWriteResGroup564 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01]> {
5111 let ReleaseAtCycles = [7, 3, 8, 5];
5113 let NumMicroOps = 23;
5115 def : InstRW<[SPRWriteResGroup564], (instrs XGETBV)>;
5117 def SPRWriteResGroup565 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort02_03_11]> {
5118 let ReleaseAtCycles = [2, 1];
5120 let NumMicroOps = 3;
5122 def : InstRW<[SPRWriteResGroup565], (instrs XLAT)>;
5124 def SPRWriteResGroup566 : SchedWriteRes<[SPRPort01, SPRPort02_03, SPRPort02_03_11, SPRPort06]> {
5125 let ReleaseAtCycles = [1, 21, 1, 8];
5127 let NumMicroOps = 31;
5129 def : InstRW<[SPRWriteResGroup566], (instregex "^XRSTOR((S|64)?)$")>;
5130 def : InstRW<[SPRWriteResGroup566], (instrs XRSTORS64)>;
5132 def SPRWriteResGroup567 : SchedWriteRes<[SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5133 let ReleaseAtCycles = [14, 25, 44, 21, 21, 4, 1, 9, 1];
5135 let NumMicroOps = 140;
5137 def : InstRW<[SPRWriteResGroup567], (instrs XSAVE)>;
5139 def SPRWriteResGroup568 : SchedWriteRes<[SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5140 let ReleaseAtCycles = [14, 25, 44, 21, 21, 4, 1, 9, 1];
5142 let NumMicroOps = 140;
5144 def : InstRW<[SPRWriteResGroup568], (instrs XSAVE64)>;
5146 def SPRWriteResGroup569 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5147 let ReleaseAtCycles = [1, 19, 36, 52, 23, 4, 2, 12, 2];
5149 let NumMicroOps = 151;
5151 def : InstRW<[SPRWriteResGroup569], (instrs XSAVEC)>;
5153 def SPRWriteResGroup570 : SchedWriteRes<[SPRPort00, SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5154 let ReleaseAtCycles = [1, 19, 36, 53, 23, 4, 2, 12, 2];
5156 let NumMicroOps = 152;
5158 def : InstRW<[SPRWriteResGroup570], (instrs XSAVEC64)>;
5160 def SPRWriteResGroup571 : SchedWriteRes<[SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5161 let ReleaseAtCycles = [25, 35, 52, 27, 4, 1, 10, 1];
5163 let NumMicroOps = 155;
5165 def : InstRW<[SPRWriteResGroup571], (instrs XSAVEOPT)>;
5167 def SPRWriteResGroup572 : SchedWriteRes<[SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5168 let ReleaseAtCycles = [25, 35, 53, 27, 4, 1, 10, 1];
5170 let NumMicroOps = 156;
5172 def : InstRW<[SPRWriteResGroup572], (instrs XSAVEOPT64)>;
5174 def SPRWriteResGroup573 : SchedWriteRes<[SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5175 let ReleaseAtCycles = [23, 32, 53, 29, 30, 4, 2, 9, 2];
5177 let NumMicroOps = 184;
5179 def : InstRW<[SPRWriteResGroup573], (instrs XSAVES)>;
5181 def SPRWriteResGroup574 : SchedWriteRes<[SPRPort00_01, SPRPort00_05, SPRPort00_06, SPRPort01, SPRPort01_05, SPRPort02_03_11, SPRPort04_09, SPRPort05, SPRPort07_08]> {
5182 let ReleaseAtCycles = [23, 33, 53, 29, 32, 4, 2, 8, 2];
5184 let NumMicroOps = 186;
5186 def : InstRW<[SPRWriteResGroup574], (instrs XSAVES64)>;
5188 def SPRWriteResGroup575 : SchedWriteRes<[SPRPort00_01_05, SPRPort00_01_05_06_10, SPRPort00_05_06, SPRPort00_06, SPRPort01, SPRPort01_05_10, SPRPort05]> {
5189 let ReleaseAtCycles = [4, 23, 2, 14, 8, 1, 2];
5191 let NumMicroOps = 54;
5193 def : InstRW<[SPRWriteResGroup575], (instrs XSETBV)>;
5195 def SPRWriteResGroup576 : SchedWriteRes<[SPRPort00_01_05_06_10, SPRPort00_06]> {
5196 let ReleaseAtCycles = [2, 1];
5197 let Latency = SapphireRapidsModel.MaxLatency;
5198 let NumMicroOps = 3;
5200 def : InstRW<[SPRWriteResGroup576], (instrs XTEST)>;