[InstCombine] Signed saturation patterns
[llvm-core.git] / test / tools / llvm-mca / X86 / Barcelona / store-throughput.s
blob08a9c47302267da424f3210963824edfa28776ac
1 # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2 # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -scheduler-stats -dispatch-stats -iterations=100 -timeline -timeline-max-iterations=1 -noalias=true < %s | FileCheck %s
# Region 0: four byte-sized stores (movb), each taking a different 8-bit
# source register and a different base-address register (rax, rcx, rdx, rbx).
4 # LLVM-MCA-BEGIN
5 movb %spl, (%rax)
6 movb %bpl, (%rcx)
7 movb %sil, (%rdx)
8 movb %dil, (%rbx)
9 # LLVM-MCA-END
# Region 1: same store pattern as the byte case, but with 16-bit source
# registers (movw); the four destination base registers are unchanged.
11 # LLVM-MCA-BEGIN
12 movw %sp, (%rax)
13 movw %bp, (%rcx)
14 movw %si, (%rdx)
15 movw %di, (%rbx)
16 # LLVM-MCA-END
# Region 2: four 32-bit stores (movl) from esp/ebp/esi/edi to the same four
# destination base registers used by the other regions.
18 # LLVM-MCA-BEGIN
19 movl %esp, (%rax)
20 movl %ebp, (%rcx)
21 movl %esi, (%rdx)
22 movl %edi, (%rbx)
23 # LLVM-MCA-END
# Region 3: four 64-bit stores (movq) from rsp/rbp/rsi/rdi to the same four
# destination base registers used by the other regions.
25 # LLVM-MCA-BEGIN
26 movq %rsp, (%rax)
27 movq %rbp, (%rcx)
28 movq %rsi, (%rdx)
29 movq %rdi, (%rbx)
30 # LLVM-MCA-END
# Region 4: four movd stores whose sources are the MMX registers mm0-mm3;
# destinations are the same four base registers used by the other regions.
32 # LLVM-MCA-BEGIN
33 movd %mm0, (%rax)
34 movd %mm1, (%rcx)
35 movd %mm2, (%rdx)
36 movd %mm3, (%rbx)
37 # LLVM-MCA-END
# Region 5: four movaps stores whose sources are the SSE registers xmm0-xmm3;
# destinations are the same four base registers used by the other regions.
39 # LLVM-MCA-BEGIN
40 movaps %xmm0, (%rax)
41 movaps %xmm1, (%rcx)
42 movaps %xmm2, (%rdx)
43 movaps %xmm3, (%rbx)
44 # LLVM-MCA-END
46 # CHECK: [0] Code Region
48 # CHECK: Iterations: 100
49 # CHECK-NEXT: Instructions: 400
50 # CHECK-NEXT: Total Cycles: 403
51 # CHECK-NEXT: Total uOps: 400
53 # CHECK: Dispatch Width: 4
54 # CHECK-NEXT: uOps Per Cycle: 0.99
55 # CHECK-NEXT: IPC: 0.99
56 # CHECK-NEXT: Block RThroughput: 4.0
58 # CHECK: Instruction Info:
59 # CHECK-NEXT: [1]: #uOps
60 # CHECK-NEXT: [2]: Latency
61 # CHECK-NEXT: [3]: RThroughput
62 # CHECK-NEXT: [4]: MayLoad
63 # CHECK-NEXT: [5]: MayStore
64 # CHECK-NEXT: [6]: HasSideEffects (U)
66 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
67 # CHECK-NEXT: 1 1 1.00 * movb %spl, (%rax)
68 # CHECK-NEXT: 1 1 1.00 * movb %bpl, (%rcx)
69 # CHECK-NEXT: 1 1 1.00 * movb %sil, (%rdx)
70 # CHECK-NEXT: 1 1 1.00 * movb %dil, (%rbx)
72 # CHECK: Dynamic Dispatch Stall Cycles:
73 # CHECK-NEXT: RAT - Register unavailable: 0
74 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
75 # CHECK-NEXT: SCHEDQ - Scheduler full: 329 (81.6%)
76 # CHECK-NEXT: LQ - Load queue full: 0
77 # CHECK-NEXT: SQ - Store queue full: 0
78 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
80 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
81 # CHECK-NEXT: [# dispatched], [# cycles]
82 # CHECK-NEXT: 0, 56 (13.9%)
83 # CHECK-NEXT: 1, 329 (81.6%)
84 # CHECK-NEXT: 3, 1 (0.2%)
85 # CHECK-NEXT: 4, 17 (4.2%)
87 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
88 # CHECK-NEXT: [# issued], [# cycles]
89 # CHECK-NEXT: 0, 3 (0.7%)
90 # CHECK-NEXT: 1, 400 (99.3%)
92 # CHECK: Scheduler's queue usage:
93 # CHECK-NEXT: [1] Resource name.
94 # CHECK-NEXT: [2] Average number of used buffer entries.
95 # CHECK-NEXT: [3] Maximum number of used buffer entries.
96 # CHECK-NEXT: [4] Total number of buffer entries.
98 # CHECK: [1] [2] [3] [4]
99 # CHECK-NEXT: SBPortAny 49 54 54
101 # CHECK: Resources:
102 # CHECK-NEXT: [0] - SBDivider
103 # CHECK-NEXT: [1] - SBFPDivider
104 # CHECK-NEXT: [2] - SBPort0
105 # CHECK-NEXT: [3] - SBPort1
106 # CHECK-NEXT: [4] - SBPort4
107 # CHECK-NEXT: [5] - SBPort5
108 # CHECK-NEXT: [6.0] - SBPort23
109 # CHECK-NEXT: [6.1] - SBPort23
111 # CHECK: Resource pressure per iteration:
112 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
113 # CHECK-NEXT: - - - - 4.00 - 2.00 2.00
115 # CHECK: Resource pressure by instruction:
116 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
117 # CHECK-NEXT: - - - - 1.00 - - 1.00 movb %spl, (%rax)
118 # CHECK-NEXT: - - - - 1.00 - 1.00 - movb %bpl, (%rcx)
119 # CHECK-NEXT: - - - - 1.00 - - 1.00 movb %sil, (%rdx)
120 # CHECK-NEXT: - - - - 1.00 - 1.00 - movb %dil, (%rbx)
122 # CHECK: Timeline view:
123 # CHECK-NEXT: Index 0123456
125 # CHECK: [0,0] DeER .. movb %spl, (%rax)
126 # CHECK-NEXT: [0,1] D=eER.. movb %bpl, (%rcx)
127 # CHECK-NEXT: [0,2] D==eER. movb %sil, (%rdx)
128 # CHECK-NEXT: [0,3] D===eER movb %dil, (%rbx)
130 # CHECK: Average Wait times (based on the timeline view):
131 # CHECK-NEXT: [0]: Executions
132 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
133 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
134 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
136 # CHECK: [0] [1] [2] [3]
137 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movb %spl, (%rax)
138 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 movb %bpl, (%rcx)
139 # CHECK-NEXT: 2. 1 3.0 0.0 0.0 movb %sil, (%rdx)
140 # CHECK-NEXT: 3. 1 4.0 0.0 0.0 movb %dil, (%rbx)
141 # CHECK-NEXT: 1 2.5 0.3 0.0 <total>
143 # CHECK: [1] Code Region
145 # CHECK: Iterations: 100
146 # CHECK-NEXT: Instructions: 400
147 # CHECK-NEXT: Total Cycles: 403
148 # CHECK-NEXT: Total uOps: 400
150 # CHECK: Dispatch Width: 4
151 # CHECK-NEXT: uOps Per Cycle: 0.99
152 # CHECK-NEXT: IPC: 0.99
153 # CHECK-NEXT: Block RThroughput: 4.0
155 # CHECK: Instruction Info:
156 # CHECK-NEXT: [1]: #uOps
157 # CHECK-NEXT: [2]: Latency
158 # CHECK-NEXT: [3]: RThroughput
159 # CHECK-NEXT: [4]: MayLoad
160 # CHECK-NEXT: [5]: MayStore
161 # CHECK-NEXT: [6]: HasSideEffects (U)
163 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
164 # CHECK-NEXT: 1 1 1.00 * movw %sp, (%rax)
165 # CHECK-NEXT: 1 1 1.00 * movw %bp, (%rcx)
166 # CHECK-NEXT: 1 1 1.00 * movw %si, (%rdx)
167 # CHECK-NEXT: 1 1 1.00 * movw %di, (%rbx)
169 # CHECK: Dynamic Dispatch Stall Cycles:
170 # CHECK-NEXT: RAT - Register unavailable: 0
171 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
172 # CHECK-NEXT: SCHEDQ - Scheduler full: 329 (81.6%)
173 # CHECK-NEXT: LQ - Load queue full: 0
174 # CHECK-NEXT: SQ - Store queue full: 0
175 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
177 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
178 # CHECK-NEXT: [# dispatched], [# cycles]
179 # CHECK-NEXT: 0, 56 (13.9%)
180 # CHECK-NEXT: 1, 329 (81.6%)
181 # CHECK-NEXT: 3, 1 (0.2%)
182 # CHECK-NEXT: 4, 17 (4.2%)
184 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
185 # CHECK-NEXT: [# issued], [# cycles]
186 # CHECK-NEXT: 0, 3 (0.7%)
187 # CHECK-NEXT: 1, 400 (99.3%)
189 # CHECK: Scheduler's queue usage:
190 # CHECK-NEXT: [1] Resource name.
191 # CHECK-NEXT: [2] Average number of used buffer entries.
192 # CHECK-NEXT: [3] Maximum number of used buffer entries.
193 # CHECK-NEXT: [4] Total number of buffer entries.
195 # CHECK: [1] [2] [3] [4]
196 # CHECK-NEXT: SBPortAny 49 54 54
198 # CHECK: Resources:
199 # CHECK-NEXT: [0] - SBDivider
200 # CHECK-NEXT: [1] - SBFPDivider
201 # CHECK-NEXT: [2] - SBPort0
202 # CHECK-NEXT: [3] - SBPort1
203 # CHECK-NEXT: [4] - SBPort4
204 # CHECK-NEXT: [5] - SBPort5
205 # CHECK-NEXT: [6.0] - SBPort23
206 # CHECK-NEXT: [6.1] - SBPort23
208 # CHECK: Resource pressure per iteration:
209 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
210 # CHECK-NEXT: - - - - 4.00 - 2.00 2.00
212 # CHECK: Resource pressure by instruction:
213 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
214 # CHECK-NEXT: - - - - 1.00 - - 1.00 movw %sp, (%rax)
215 # CHECK-NEXT: - - - - 1.00 - 1.00 - movw %bp, (%rcx)
216 # CHECK-NEXT: - - - - 1.00 - - 1.00 movw %si, (%rdx)
217 # CHECK-NEXT: - - - - 1.00 - 1.00 - movw %di, (%rbx)
219 # CHECK: Timeline view:
220 # CHECK-NEXT: Index 0123456
222 # CHECK: [0,0] DeER .. movw %sp, (%rax)
223 # CHECK-NEXT: [0,1] D=eER.. movw %bp, (%rcx)
224 # CHECK-NEXT: [0,2] D==eER. movw %si, (%rdx)
225 # CHECK-NEXT: [0,3] D===eER movw %di, (%rbx)
227 # CHECK: Average Wait times (based on the timeline view):
228 # CHECK-NEXT: [0]: Executions
229 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
230 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
231 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
233 # CHECK: [0] [1] [2] [3]
234 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movw %sp, (%rax)
235 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 movw %bp, (%rcx)
236 # CHECK-NEXT: 2. 1 3.0 0.0 0.0 movw %si, (%rdx)
237 # CHECK-NEXT: 3. 1 4.0 0.0 0.0 movw %di, (%rbx)
238 # CHECK-NEXT: 1 2.5 0.3 0.0 <total>
240 # CHECK: [2] Code Region
242 # CHECK: Iterations: 100
243 # CHECK-NEXT: Instructions: 400
244 # CHECK-NEXT: Total Cycles: 403
245 # CHECK-NEXT: Total uOps: 400
247 # CHECK: Dispatch Width: 4
248 # CHECK-NEXT: uOps Per Cycle: 0.99
249 # CHECK-NEXT: IPC: 0.99
250 # CHECK-NEXT: Block RThroughput: 4.0
252 # CHECK: Instruction Info:
253 # CHECK-NEXT: [1]: #uOps
254 # CHECK-NEXT: [2]: Latency
255 # CHECK-NEXT: [3]: RThroughput
256 # CHECK-NEXT: [4]: MayLoad
257 # CHECK-NEXT: [5]: MayStore
258 # CHECK-NEXT: [6]: HasSideEffects (U)
260 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
261 # CHECK-NEXT: 1 1 1.00 * movl %esp, (%rax)
262 # CHECK-NEXT: 1 1 1.00 * movl %ebp, (%rcx)
263 # CHECK-NEXT: 1 1 1.00 * movl %esi, (%rdx)
264 # CHECK-NEXT: 1 1 1.00 * movl %edi, (%rbx)
266 # CHECK: Dynamic Dispatch Stall Cycles:
267 # CHECK-NEXT: RAT - Register unavailable: 0
268 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
269 # CHECK-NEXT: SCHEDQ - Scheduler full: 329 (81.6%)
270 # CHECK-NEXT: LQ - Load queue full: 0
271 # CHECK-NEXT: SQ - Store queue full: 0
272 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
274 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
275 # CHECK-NEXT: [# dispatched], [# cycles]
276 # CHECK-NEXT: 0, 56 (13.9%)
277 # CHECK-NEXT: 1, 329 (81.6%)
278 # CHECK-NEXT: 3, 1 (0.2%)
279 # CHECK-NEXT: 4, 17 (4.2%)
281 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
282 # CHECK-NEXT: [# issued], [# cycles]
283 # CHECK-NEXT: 0, 3 (0.7%)
284 # CHECK-NEXT: 1, 400 (99.3%)
286 # CHECK: Scheduler's queue usage:
287 # CHECK-NEXT: [1] Resource name.
288 # CHECK-NEXT: [2] Average number of used buffer entries.
289 # CHECK-NEXT: [3] Maximum number of used buffer entries.
290 # CHECK-NEXT: [4] Total number of buffer entries.
292 # CHECK: [1] [2] [3] [4]
293 # CHECK-NEXT: SBPortAny 49 54 54
295 # CHECK: Resources:
296 # CHECK-NEXT: [0] - SBDivider
297 # CHECK-NEXT: [1] - SBFPDivider
298 # CHECK-NEXT: [2] - SBPort0
299 # CHECK-NEXT: [3] - SBPort1
300 # CHECK-NEXT: [4] - SBPort4
301 # CHECK-NEXT: [5] - SBPort5
302 # CHECK-NEXT: [6.0] - SBPort23
303 # CHECK-NEXT: [6.1] - SBPort23
305 # CHECK: Resource pressure per iteration:
306 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
307 # CHECK-NEXT: - - - - 4.00 - 2.00 2.00
309 # CHECK: Resource pressure by instruction:
310 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
311 # CHECK-NEXT: - - - - 1.00 - - 1.00 movl %esp, (%rax)
312 # CHECK-NEXT: - - - - 1.00 - 1.00 - movl %ebp, (%rcx)
313 # CHECK-NEXT: - - - - 1.00 - - 1.00 movl %esi, (%rdx)
314 # CHECK-NEXT: - - - - 1.00 - 1.00 - movl %edi, (%rbx)
316 # CHECK: Timeline view:
317 # CHECK-NEXT: Index 0123456
319 # CHECK: [0,0] DeER .. movl %esp, (%rax)
320 # CHECK-NEXT: [0,1] D=eER.. movl %ebp, (%rcx)
321 # CHECK-NEXT: [0,2] D==eER. movl %esi, (%rdx)
322 # CHECK-NEXT: [0,3] D===eER movl %edi, (%rbx)
324 # CHECK: Average Wait times (based on the timeline view):
325 # CHECK-NEXT: [0]: Executions
326 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
327 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
328 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
330 # CHECK: [0] [1] [2] [3]
331 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movl %esp, (%rax)
332 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 movl %ebp, (%rcx)
333 # CHECK-NEXT: 2. 1 3.0 0.0 0.0 movl %esi, (%rdx)
334 # CHECK-NEXT: 3. 1 4.0 0.0 0.0 movl %edi, (%rbx)
335 # CHECK-NEXT: 1 2.5 0.3 0.0 <total>
337 # CHECK: [3] Code Region
339 # CHECK: Iterations: 100
340 # CHECK-NEXT: Instructions: 400
341 # CHECK-NEXT: Total Cycles: 403
342 # CHECK-NEXT: Total uOps: 400
344 # CHECK: Dispatch Width: 4
345 # CHECK-NEXT: uOps Per Cycle: 0.99
346 # CHECK-NEXT: IPC: 0.99
347 # CHECK-NEXT: Block RThroughput: 4.0
349 # CHECK: Instruction Info:
350 # CHECK-NEXT: [1]: #uOps
351 # CHECK-NEXT: [2]: Latency
352 # CHECK-NEXT: [3]: RThroughput
353 # CHECK-NEXT: [4]: MayLoad
354 # CHECK-NEXT: [5]: MayStore
355 # CHECK-NEXT: [6]: HasSideEffects (U)
357 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
358 # CHECK-NEXT: 1 1 1.00 * movq %rsp, (%rax)
359 # CHECK-NEXT: 1 1 1.00 * movq %rbp, (%rcx)
360 # CHECK-NEXT: 1 1 1.00 * movq %rsi, (%rdx)
361 # CHECK-NEXT: 1 1 1.00 * movq %rdi, (%rbx)
363 # CHECK: Dynamic Dispatch Stall Cycles:
364 # CHECK-NEXT: RAT - Register unavailable: 0
365 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
366 # CHECK-NEXT: SCHEDQ - Scheduler full: 329 (81.6%)
367 # CHECK-NEXT: LQ - Load queue full: 0
368 # CHECK-NEXT: SQ - Store queue full: 0
369 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
371 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
372 # CHECK-NEXT: [# dispatched], [# cycles]
373 # CHECK-NEXT: 0, 56 (13.9%)
374 # CHECK-NEXT: 1, 329 (81.6%)
375 # CHECK-NEXT: 3, 1 (0.2%)
376 # CHECK-NEXT: 4, 17 (4.2%)
378 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
379 # CHECK-NEXT: [# issued], [# cycles]
380 # CHECK-NEXT: 0, 3 (0.7%)
381 # CHECK-NEXT: 1, 400 (99.3%)
383 # CHECK: Scheduler's queue usage:
384 # CHECK-NEXT: [1] Resource name.
385 # CHECK-NEXT: [2] Average number of used buffer entries.
386 # CHECK-NEXT: [3] Maximum number of used buffer entries.
387 # CHECK-NEXT: [4] Total number of buffer entries.
389 # CHECK: [1] [2] [3] [4]
390 # CHECK-NEXT: SBPortAny 49 54 54
392 # CHECK: Resources:
393 # CHECK-NEXT: [0] - SBDivider
394 # CHECK-NEXT: [1] - SBFPDivider
395 # CHECK-NEXT: [2] - SBPort0
396 # CHECK-NEXT: [3] - SBPort1
397 # CHECK-NEXT: [4] - SBPort4
398 # CHECK-NEXT: [5] - SBPort5
399 # CHECK-NEXT: [6.0] - SBPort23
400 # CHECK-NEXT: [6.1] - SBPort23
402 # CHECK: Resource pressure per iteration:
403 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
404 # CHECK-NEXT: - - - - 4.00 - 2.00 2.00
406 # CHECK: Resource pressure by instruction:
407 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
408 # CHECK-NEXT: - - - - 1.00 - - 1.00 movq %rsp, (%rax)
409 # CHECK-NEXT: - - - - 1.00 - 1.00 - movq %rbp, (%rcx)
410 # CHECK-NEXT: - - - - 1.00 - - 1.00 movq %rsi, (%rdx)
411 # CHECK-NEXT: - - - - 1.00 - 1.00 - movq %rdi, (%rbx)
413 # CHECK: Timeline view:
414 # CHECK-NEXT: Index 0123456
416 # CHECK: [0,0] DeER .. movq %rsp, (%rax)
417 # CHECK-NEXT: [0,1] D=eER.. movq %rbp, (%rcx)
418 # CHECK-NEXT: [0,2] D==eER. movq %rsi, (%rdx)
419 # CHECK-NEXT: [0,3] D===eER movq %rdi, (%rbx)
421 # CHECK: Average Wait times (based on the timeline view):
422 # CHECK-NEXT: [0]: Executions
423 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
424 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
425 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
427 # CHECK: [0] [1] [2] [3]
428 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movq %rsp, (%rax)
429 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 movq %rbp, (%rcx)
430 # CHECK-NEXT: 2. 1 3.0 0.0 0.0 movq %rsi, (%rdx)
431 # CHECK-NEXT: 3. 1 4.0 0.0 0.0 movq %rdi, (%rbx)
432 # CHECK-NEXT: 1 2.5 0.3 0.0 <total>
434 # CHECK: [4] Code Region
436 # CHECK: Iterations: 100
437 # CHECK-NEXT: Instructions: 400
438 # CHECK-NEXT: Total Cycles: 403
439 # CHECK-NEXT: Total uOps: 400
441 # CHECK: Dispatch Width: 4
442 # CHECK-NEXT: uOps Per Cycle: 0.99
443 # CHECK-NEXT: IPC: 0.99
444 # CHECK-NEXT: Block RThroughput: 4.0
446 # CHECK: Instruction Info:
447 # CHECK-NEXT: [1]: #uOps
448 # CHECK-NEXT: [2]: Latency
449 # CHECK-NEXT: [3]: RThroughput
450 # CHECK-NEXT: [4]: MayLoad
451 # CHECK-NEXT: [5]: MayStore
452 # CHECK-NEXT: [6]: HasSideEffects (U)
454 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
455 # CHECK-NEXT: 1 1 1.00 * U movd %mm0, (%rax)
456 # CHECK-NEXT: 1 1 1.00 * U movd %mm1, (%rcx)
457 # CHECK-NEXT: 1 1 1.00 * U movd %mm2, (%rdx)
458 # CHECK-NEXT: 1 1 1.00 * U movd %mm3, (%rbx)
460 # CHECK: Dynamic Dispatch Stall Cycles:
461 # CHECK-NEXT: RAT - Register unavailable: 0
462 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
463 # CHECK-NEXT: SCHEDQ - Scheduler full: 329 (81.6%)
464 # CHECK-NEXT: LQ - Load queue full: 0
465 # CHECK-NEXT: SQ - Store queue full: 0
466 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
468 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
469 # CHECK-NEXT: [# dispatched], [# cycles]
470 # CHECK-NEXT: 0, 56 (13.9%)
471 # CHECK-NEXT: 1, 329 (81.6%)
472 # CHECK-NEXT: 3, 1 (0.2%)
473 # CHECK-NEXT: 4, 17 (4.2%)
475 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
476 # CHECK-NEXT: [# issued], [# cycles]
477 # CHECK-NEXT: 0, 3 (0.7%)
478 # CHECK-NEXT: 1, 400 (99.3%)
480 # CHECK: Scheduler's queue usage:
481 # CHECK-NEXT: [1] Resource name.
482 # CHECK-NEXT: [2] Average number of used buffer entries.
483 # CHECK-NEXT: [3] Maximum number of used buffer entries.
484 # CHECK-NEXT: [4] Total number of buffer entries.
486 # CHECK: [1] [2] [3] [4]
487 # CHECK-NEXT: SBPortAny 49 54 54
489 # CHECK: Resources:
490 # CHECK-NEXT: [0] - SBDivider
491 # CHECK-NEXT: [1] - SBFPDivider
492 # CHECK-NEXT: [2] - SBPort0
493 # CHECK-NEXT: [3] - SBPort1
494 # CHECK-NEXT: [4] - SBPort4
495 # CHECK-NEXT: [5] - SBPort5
496 # CHECK-NEXT: [6.0] - SBPort23
497 # CHECK-NEXT: [6.1] - SBPort23
499 # CHECK: Resource pressure per iteration:
500 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
501 # CHECK-NEXT: - - - - 4.00 - 2.00 2.00
503 # CHECK: Resource pressure by instruction:
504 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
505 # CHECK-NEXT: - - - - 1.00 - - 1.00 movd %mm0, (%rax)
506 # CHECK-NEXT: - - - - 1.00 - 1.00 - movd %mm1, (%rcx)
507 # CHECK-NEXT: - - - - 1.00 - - 1.00 movd %mm2, (%rdx)
508 # CHECK-NEXT: - - - - 1.00 - 1.00 - movd %mm3, (%rbx)
510 # CHECK: Timeline view:
511 # CHECK-NEXT: Index 0123456
513 # CHECK: [0,0] DeER .. movd %mm0, (%rax)
514 # CHECK-NEXT: [0,1] D=eER.. movd %mm1, (%rcx)
515 # CHECK-NEXT: [0,2] D==eER. movd %mm2, (%rdx)
516 # CHECK-NEXT: [0,3] D===eER movd %mm3, (%rbx)
518 # CHECK: Average Wait times (based on the timeline view):
519 # CHECK-NEXT: [0]: Executions
520 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
521 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
522 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
524 # CHECK: [0] [1] [2] [3]
525 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movd %mm0, (%rax)
526 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 movd %mm1, (%rcx)
527 # CHECK-NEXT: 2. 1 3.0 0.0 0.0 movd %mm2, (%rdx)
528 # CHECK-NEXT: 3. 1 4.0 0.0 0.0 movd %mm3, (%rbx)
529 # CHECK-NEXT: 1 2.5 0.3 0.0 <total>
531 # CHECK: [5] Code Region
533 # CHECK: Iterations: 100
534 # CHECK-NEXT: Instructions: 400
535 # CHECK-NEXT: Total Cycles: 403
536 # CHECK-NEXT: Total uOps: 400
538 # CHECK: Dispatch Width: 4
539 # CHECK-NEXT: uOps Per Cycle: 0.99
540 # CHECK-NEXT: IPC: 0.99
541 # CHECK-NEXT: Block RThroughput: 4.0
543 # CHECK: Instruction Info:
544 # CHECK-NEXT: [1]: #uOps
545 # CHECK-NEXT: [2]: Latency
546 # CHECK-NEXT: [3]: RThroughput
547 # CHECK-NEXT: [4]: MayLoad
548 # CHECK-NEXT: [5]: MayStore
549 # CHECK-NEXT: [6]: HasSideEffects (U)
551 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
552 # CHECK-NEXT: 1 1 1.00 * movaps %xmm0, (%rax)
553 # CHECK-NEXT: 1 1 1.00 * movaps %xmm1, (%rcx)
554 # CHECK-NEXT: 1 1 1.00 * movaps %xmm2, (%rdx)
555 # CHECK-NEXT: 1 1 1.00 * movaps %xmm3, (%rbx)
557 # CHECK: Dynamic Dispatch Stall Cycles:
558 # CHECK-NEXT: RAT - Register unavailable: 0
559 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
560 # CHECK-NEXT: SCHEDQ - Scheduler full: 329 (81.6%)
561 # CHECK-NEXT: LQ - Load queue full: 0
562 # CHECK-NEXT: SQ - Store queue full: 0
563 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
565 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
566 # CHECK-NEXT: [# dispatched], [# cycles]
567 # CHECK-NEXT: 0, 56 (13.9%)
568 # CHECK-NEXT: 1, 329 (81.6%)
569 # CHECK-NEXT: 3, 1 (0.2%)
570 # CHECK-NEXT: 4, 17 (4.2%)
572 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
573 # CHECK-NEXT: [# issued], [# cycles]
574 # CHECK-NEXT: 0, 3 (0.7%)
575 # CHECK-NEXT: 1, 400 (99.3%)
577 # CHECK: Scheduler's queue usage:
578 # CHECK-NEXT: [1] Resource name.
579 # CHECK-NEXT: [2] Average number of used buffer entries.
580 # CHECK-NEXT: [3] Maximum number of used buffer entries.
581 # CHECK-NEXT: [4] Total number of buffer entries.
583 # CHECK: [1] [2] [3] [4]
584 # CHECK-NEXT: SBPortAny 49 54 54
586 # CHECK: Resources:
587 # CHECK-NEXT: [0] - SBDivider
588 # CHECK-NEXT: [1] - SBFPDivider
589 # CHECK-NEXT: [2] - SBPort0
590 # CHECK-NEXT: [3] - SBPort1
591 # CHECK-NEXT: [4] - SBPort4
592 # CHECK-NEXT: [5] - SBPort5
593 # CHECK-NEXT: [6.0] - SBPort23
594 # CHECK-NEXT: [6.1] - SBPort23
596 # CHECK: Resource pressure per iteration:
597 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
598 # CHECK-NEXT: - - - - 4.00 - 2.00 2.00
600 # CHECK: Resource pressure by instruction:
601 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
602 # CHECK-NEXT: - - - - 1.00 - - 1.00 movaps %xmm0, (%rax)
603 # CHECK-NEXT: - - - - 1.00 - 1.00 - movaps %xmm1, (%rcx)
604 # CHECK-NEXT: - - - - 1.00 - - 1.00 movaps %xmm2, (%rdx)
605 # CHECK-NEXT: - - - - 1.00 - 1.00 - movaps %xmm3, (%rbx)
607 # CHECK: Timeline view:
608 # CHECK-NEXT: Index 0123456
610 # CHECK: [0,0] DeER .. movaps %xmm0, (%rax)
611 # CHECK-NEXT: [0,1] D=eER.. movaps %xmm1, (%rcx)
612 # CHECK-NEXT: [0,2] D==eER. movaps %xmm2, (%rdx)
613 # CHECK-NEXT: [0,3] D===eER movaps %xmm3, (%rbx)
615 # CHECK: Average Wait times (based on the timeline view):
616 # CHECK-NEXT: [0]: Executions
617 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
618 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
619 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
621 # CHECK: [0] [1] [2] [3]
622 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movaps %xmm0, (%rax)
623 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 movaps %xmm1, (%rcx)
624 # CHECK-NEXT: 2. 1 3.0 0.0 0.0 movaps %xmm2, (%rdx)
625 # CHECK-NEXT: 3. 1 4.0 0.0 0.0 movaps %xmm3, (%rbx)
626 # CHECK-NEXT: 1 2.5 0.3 0.0 <total>