[ARM] Cortex-M4 schedule additions
[llvm-complete.git] / test / tools / llvm-mca / X86 / Barcelona / load-store-throughput.s
blob27d207990297e8cfa098ed0aa36dad9ad1241895
1 # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2 # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -scheduler-stats -dispatch-stats -iterations=100 -timeline -timeline-max-iterations=1 < %s | FileCheck %s
# Region 0: byte-sized moves (movb) issued as store, load, load, store.
# Every memory operand uses a different base register (rax, rcx, rdx, rbx),
# and the two loads write different destination registers.
4 # LLVM-MCA-BEGIN
5 movb %spl, (%rax)
6 movb (%rcx), %bpl
7 movb (%rdx), %sil
8 movb %dil, (%rbx)
9 # LLVM-MCA-END
# Region 1: same store, load, load, store pattern as the movb region,
# using word-sized moves (movw) and 16-bit registers.
11 # LLVM-MCA-BEGIN
12 movw %sp, (%rax)
13 movw (%rcx), %bp
14 movw (%rdx), %si
15 movw %di, (%rbx)
16 # LLVM-MCA-END
# Region 2: same store, load, load, store pattern, using long-sized
# moves (movl) and 32-bit registers.
18 # LLVM-MCA-BEGIN
19 movl %esp, (%rax)
20 movl (%rcx), %ebp
21 movl (%rdx), %esi
22 movl %edi, (%rbx)
23 # LLVM-MCA-END
# Region 3: same store, load, load, store pattern, using quad-sized
# moves (movq) and 64-bit general-purpose registers.
25 # LLVM-MCA-BEGIN
26 movq %rsp, (%rax)
27 movq (%rcx), %rbp
28 movq (%rdx), %rsi
29 movq %rdi, (%rbx)
30 # LLVM-MCA-END
# Region 4: same store, load, load, store pattern, using movd between
# MMX registers (%mm0-%mm3) and memory. In the expected instruction-info
# table the two store forms are the only rows flagged 'U' (HasSideEffects).
32 # LLVM-MCA-BEGIN
33 movd %mm0, (%rax)
34 movd (%rcx), %mm1
35 movd (%rdx), %mm2
36 movd %mm3, (%rbx)
37 # LLVM-MCA-END
# Region 5: same store, load, load, store pattern, using movaps between
# XMM registers (%xmm0-%xmm3) and memory. The expected report lists these
# loads with latency 6 (the other regions show 5) and a total of 209 cycles
# (the other regions show 208).
39 # LLVM-MCA-BEGIN
40 movaps %xmm0, (%rax)
41 movaps (%rcx), %xmm1
42 movaps (%rdx), %xmm2
43 movaps %xmm3, (%rbx)
44 # LLVM-MCA-END
46 # CHECK: [0] Code Region
48 # CHECK: Iterations: 100
49 # CHECK-NEXT: Instructions: 400
50 # CHECK-NEXT: Total Cycles: 208
51 # CHECK-NEXT: Total uOps: 400
53 # CHECK: Dispatch Width: 4
54 # CHECK-NEXT: uOps Per Cycle: 1.92
55 # CHECK-NEXT: IPC: 1.92
56 # CHECK-NEXT: Block RThroughput: 2.0
58 # CHECK: Instruction Info:
59 # CHECK-NEXT: [1]: #uOps
60 # CHECK-NEXT: [2]: Latency
61 # CHECK-NEXT: [3]: RThroughput
62 # CHECK-NEXT: [4]: MayLoad
63 # CHECK-NEXT: [5]: MayStore
64 # CHECK-NEXT: [6]: HasSideEffects (U)
66 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
67 # CHECK-NEXT: 1 1 1.00 * movb %spl, (%rax)
68 # CHECK-NEXT: 1 5 0.50 * movb (%rcx), %bpl
69 # CHECK-NEXT: 1 5 0.50 * movb (%rdx), %sil
70 # CHECK-NEXT: 1 1 1.00 * movb %dil, (%rbx)
72 # CHECK: Dynamic Dispatch Stall Cycles:
73 # CHECK-NEXT: RAT - Register unavailable: 0
74 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
75 # CHECK-NEXT: SCHEDQ - Scheduler full: 147 (70.7%)
76 # CHECK-NEXT: LQ - Load queue full: 0
77 # CHECK-NEXT: SQ - Store queue full: 0
78 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
80 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
81 # CHECK-NEXT: [# dispatched], [# cycles]
82 # CHECK-NEXT: 0, 34 (16.3%)
83 # CHECK-NEXT: 2, 148 (71.2%)
84 # CHECK-NEXT: 4, 26 (12.5%)
86 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
87 # CHECK-NEXT: [# issued], [# cycles]
88 # CHECK-NEXT: 0, 3 (1.4%)
89 # CHECK-NEXT: 1, 10 (4.8%)
90 # CHECK-NEXT: 2, 195 (93.8%)
92 # CHECK: Scheduler's queue usage:
93 # CHECK-NEXT: [1] Resource name.
94 # CHECK-NEXT: [2] Average number of used buffer entries.
95 # CHECK-NEXT: [3] Maximum number of used buffer entries.
96 # CHECK-NEXT: [4] Total number of buffer entries.
98 # CHECK: [1] [2] [3] [4]
99 # CHECK-NEXT: SBPortAny 45 54 54
101 # CHECK: Resources:
102 # CHECK-NEXT: [0] - SBDivider
103 # CHECK-NEXT: [1] - SBFPDivider
104 # CHECK-NEXT: [2] - SBPort0
105 # CHECK-NEXT: [3] - SBPort1
106 # CHECK-NEXT: [4] - SBPort4
107 # CHECK-NEXT: [5] - SBPort5
108 # CHECK-NEXT: [6.0] - SBPort23
109 # CHECK-NEXT: [6.1] - SBPort23
111 # CHECK: Resource pressure per iteration:
112 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
113 # CHECK-NEXT: - - - - 2.00 - 2.00 2.00
115 # CHECK: Resource pressure by instruction:
116 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
117 # CHECK-NEXT: - - - - 1.00 - - 1.00 movb %spl, (%rax)
118 # CHECK-NEXT: - - - - - - 1.00 - movb (%rcx), %bpl
119 # CHECK-NEXT: - - - - - - 0.95 0.05 movb (%rdx), %sil
120 # CHECK-NEXT: - - - - 1.00 - 0.05 0.95 movb %dil, (%rbx)
122 # CHECK: Timeline view:
123 # CHECK-NEXT: Index 0123456789
125 # CHECK: [0,0] DeER . . movb %spl, (%rax)
126 # CHECK-NEXT: [0,1] DeeeeeER . movb (%rcx), %bpl
127 # CHECK-NEXT: [0,2] D=eeeeeER. movb (%rdx), %sil
128 # CHECK-NEXT: [0,3] D======eER movb %dil, (%rbx)
130 # CHECK: Average Wait times (based on the timeline view):
131 # CHECK-NEXT: [0]: Executions
132 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
133 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
134 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
136 # CHECK: [0] [1] [2] [3]
137 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movb %spl, (%rax)
138 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 movb (%rcx), %bpl
139 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 movb (%rdx), %sil
140 # CHECK-NEXT: 3. 1 7.0 0.0 0.0 movb %dil, (%rbx)
142 # CHECK: [1] Code Region
144 # CHECK: Iterations: 100
145 # CHECK-NEXT: Instructions: 400
146 # CHECK-NEXT: Total Cycles: 208
147 # CHECK-NEXT: Total uOps: 400
149 # CHECK: Dispatch Width: 4
150 # CHECK-NEXT: uOps Per Cycle: 1.92
151 # CHECK-NEXT: IPC: 1.92
152 # CHECK-NEXT: Block RThroughput: 2.0
154 # CHECK: Instruction Info:
155 # CHECK-NEXT: [1]: #uOps
156 # CHECK-NEXT: [2]: Latency
157 # CHECK-NEXT: [3]: RThroughput
158 # CHECK-NEXT: [4]: MayLoad
159 # CHECK-NEXT: [5]: MayStore
160 # CHECK-NEXT: [6]: HasSideEffects (U)
162 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
163 # CHECK-NEXT: 1 1 1.00 * movw %sp, (%rax)
164 # CHECK-NEXT: 1 5 0.50 * movw (%rcx), %bp
165 # CHECK-NEXT: 1 5 0.50 * movw (%rdx), %si
166 # CHECK-NEXT: 1 1 1.00 * movw %di, (%rbx)
168 # CHECK: Dynamic Dispatch Stall Cycles:
169 # CHECK-NEXT: RAT - Register unavailable: 0
170 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
171 # CHECK-NEXT: SCHEDQ - Scheduler full: 147 (70.7%)
172 # CHECK-NEXT: LQ - Load queue full: 0
173 # CHECK-NEXT: SQ - Store queue full: 0
174 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
176 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
177 # CHECK-NEXT: [# dispatched], [# cycles]
178 # CHECK-NEXT: 0, 34 (16.3%)
179 # CHECK-NEXT: 2, 148 (71.2%)
180 # CHECK-NEXT: 4, 26 (12.5%)
182 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
183 # CHECK-NEXT: [# issued], [# cycles]
184 # CHECK-NEXT: 0, 3 (1.4%)
185 # CHECK-NEXT: 1, 10 (4.8%)
186 # CHECK-NEXT: 2, 195 (93.8%)
188 # CHECK: Scheduler's queue usage:
189 # CHECK-NEXT: [1] Resource name.
190 # CHECK-NEXT: [2] Average number of used buffer entries.
191 # CHECK-NEXT: [3] Maximum number of used buffer entries.
192 # CHECK-NEXT: [4] Total number of buffer entries.
194 # CHECK: [1] [2] [3] [4]
195 # CHECK-NEXT: SBPortAny 45 54 54
197 # CHECK: Resources:
198 # CHECK-NEXT: [0] - SBDivider
199 # CHECK-NEXT: [1] - SBFPDivider
200 # CHECK-NEXT: [2] - SBPort0
201 # CHECK-NEXT: [3] - SBPort1
202 # CHECK-NEXT: [4] - SBPort4
203 # CHECK-NEXT: [5] - SBPort5
204 # CHECK-NEXT: [6.0] - SBPort23
205 # CHECK-NEXT: [6.1] - SBPort23
207 # CHECK: Resource pressure per iteration:
208 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
209 # CHECK-NEXT: - - - - 2.00 - 2.00 2.00
211 # CHECK: Resource pressure by instruction:
212 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
213 # CHECK-NEXT: - - - - 1.00 - - 1.00 movw %sp, (%rax)
214 # CHECK-NEXT: - - - - - - 1.00 - movw (%rcx), %bp
215 # CHECK-NEXT: - - - - - - 0.95 0.05 movw (%rdx), %si
216 # CHECK-NEXT: - - - - 1.00 - 0.05 0.95 movw %di, (%rbx)
218 # CHECK: Timeline view:
219 # CHECK-NEXT: Index 0123456789
221 # CHECK: [0,0] DeER . . movw %sp, (%rax)
222 # CHECK-NEXT: [0,1] DeeeeeER . movw (%rcx), %bp
223 # CHECK-NEXT: [0,2] D=eeeeeER. movw (%rdx), %si
224 # CHECK-NEXT: [0,3] D======eER movw %di, (%rbx)
226 # CHECK: Average Wait times (based on the timeline view):
227 # CHECK-NEXT: [0]: Executions
228 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
229 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
230 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
232 # CHECK: [0] [1] [2] [3]
233 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movw %sp, (%rax)
234 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 movw (%rcx), %bp
235 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 movw (%rdx), %si
236 # CHECK-NEXT: 3. 1 7.0 0.0 0.0 movw %di, (%rbx)
238 # CHECK: [2] Code Region
240 # CHECK: Iterations: 100
241 # CHECK-NEXT: Instructions: 400
242 # CHECK-NEXT: Total Cycles: 208
243 # CHECK-NEXT: Total uOps: 400
245 # CHECK: Dispatch Width: 4
246 # CHECK-NEXT: uOps Per Cycle: 1.92
247 # CHECK-NEXT: IPC: 1.92
248 # CHECK-NEXT: Block RThroughput: 2.0
250 # CHECK: Instruction Info:
251 # CHECK-NEXT: [1]: #uOps
252 # CHECK-NEXT: [2]: Latency
253 # CHECK-NEXT: [3]: RThroughput
254 # CHECK-NEXT: [4]: MayLoad
255 # CHECK-NEXT: [5]: MayStore
256 # CHECK-NEXT: [6]: HasSideEffects (U)
258 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
259 # CHECK-NEXT: 1 1 1.00 * movl %esp, (%rax)
260 # CHECK-NEXT: 1 5 0.50 * movl (%rcx), %ebp
261 # CHECK-NEXT: 1 5 0.50 * movl (%rdx), %esi
262 # CHECK-NEXT: 1 1 1.00 * movl %edi, (%rbx)
264 # CHECK: Dynamic Dispatch Stall Cycles:
265 # CHECK-NEXT: RAT - Register unavailable: 0
266 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
267 # CHECK-NEXT: SCHEDQ - Scheduler full: 147 (70.7%)
268 # CHECK-NEXT: LQ - Load queue full: 0
269 # CHECK-NEXT: SQ - Store queue full: 0
270 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
272 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
273 # CHECK-NEXT: [# dispatched], [# cycles]
274 # CHECK-NEXT: 0, 34 (16.3%)
275 # CHECK-NEXT: 2, 148 (71.2%)
276 # CHECK-NEXT: 4, 26 (12.5%)
278 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
279 # CHECK-NEXT: [# issued], [# cycles]
280 # CHECK-NEXT: 0, 3 (1.4%)
281 # CHECK-NEXT: 1, 10 (4.8%)
282 # CHECK-NEXT: 2, 195 (93.8%)
284 # CHECK: Scheduler's queue usage:
285 # CHECK-NEXT: [1] Resource name.
286 # CHECK-NEXT: [2] Average number of used buffer entries.
287 # CHECK-NEXT: [3] Maximum number of used buffer entries.
288 # CHECK-NEXT: [4] Total number of buffer entries.
290 # CHECK: [1] [2] [3] [4]
291 # CHECK-NEXT: SBPortAny 45 54 54
293 # CHECK: Resources:
294 # CHECK-NEXT: [0] - SBDivider
295 # CHECK-NEXT: [1] - SBFPDivider
296 # CHECK-NEXT: [2] - SBPort0
297 # CHECK-NEXT: [3] - SBPort1
298 # CHECK-NEXT: [4] - SBPort4
299 # CHECK-NEXT: [5] - SBPort5
300 # CHECK-NEXT: [6.0] - SBPort23
301 # CHECK-NEXT: [6.1] - SBPort23
303 # CHECK: Resource pressure per iteration:
304 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
305 # CHECK-NEXT: - - - - 2.00 - 2.00 2.00
307 # CHECK: Resource pressure by instruction:
308 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
309 # CHECK-NEXT: - - - - 1.00 - - 1.00 movl %esp, (%rax)
310 # CHECK-NEXT: - - - - - - 1.00 - movl (%rcx), %ebp
311 # CHECK-NEXT: - - - - - - 0.95 0.05 movl (%rdx), %esi
312 # CHECK-NEXT: - - - - 1.00 - 0.05 0.95 movl %edi, (%rbx)
314 # CHECK: Timeline view:
315 # CHECK-NEXT: Index 0123456789
317 # CHECK: [0,0] DeER . . movl %esp, (%rax)
318 # CHECK-NEXT: [0,1] DeeeeeER . movl (%rcx), %ebp
319 # CHECK-NEXT: [0,2] D=eeeeeER. movl (%rdx), %esi
320 # CHECK-NEXT: [0,3] D======eER movl %edi, (%rbx)
322 # CHECK: Average Wait times (based on the timeline view):
323 # CHECK-NEXT: [0]: Executions
324 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
325 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
326 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
328 # CHECK: [0] [1] [2] [3]
329 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movl %esp, (%rax)
330 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 movl (%rcx), %ebp
331 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 movl (%rdx), %esi
332 # CHECK-NEXT: 3. 1 7.0 0.0 0.0 movl %edi, (%rbx)
334 # CHECK: [3] Code Region
336 # CHECK: Iterations: 100
337 # CHECK-NEXT: Instructions: 400
338 # CHECK-NEXT: Total Cycles: 208
339 # CHECK-NEXT: Total uOps: 400
341 # CHECK: Dispatch Width: 4
342 # CHECK-NEXT: uOps Per Cycle: 1.92
343 # CHECK-NEXT: IPC: 1.92
344 # CHECK-NEXT: Block RThroughput: 2.0
346 # CHECK: Instruction Info:
347 # CHECK-NEXT: [1]: #uOps
348 # CHECK-NEXT: [2]: Latency
349 # CHECK-NEXT: [3]: RThroughput
350 # CHECK-NEXT: [4]: MayLoad
351 # CHECK-NEXT: [5]: MayStore
352 # CHECK-NEXT: [6]: HasSideEffects (U)
354 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
355 # CHECK-NEXT: 1 1 1.00 * movq %rsp, (%rax)
356 # CHECK-NEXT: 1 5 0.50 * movq (%rcx), %rbp
357 # CHECK-NEXT: 1 5 0.50 * movq (%rdx), %rsi
358 # CHECK-NEXT: 1 1 1.00 * movq %rdi, (%rbx)
360 # CHECK: Dynamic Dispatch Stall Cycles:
361 # CHECK-NEXT: RAT - Register unavailable: 0
362 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
363 # CHECK-NEXT: SCHEDQ - Scheduler full: 147 (70.7%)
364 # CHECK-NEXT: LQ - Load queue full: 0
365 # CHECK-NEXT: SQ - Store queue full: 0
366 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
368 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
369 # CHECK-NEXT: [# dispatched], [# cycles]
370 # CHECK-NEXT: 0, 34 (16.3%)
371 # CHECK-NEXT: 2, 148 (71.2%)
372 # CHECK-NEXT: 4, 26 (12.5%)
374 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
375 # CHECK-NEXT: [# issued], [# cycles]
376 # CHECK-NEXT: 0, 3 (1.4%)
377 # CHECK-NEXT: 1, 10 (4.8%)
378 # CHECK-NEXT: 2, 195 (93.8%)
380 # CHECK: Scheduler's queue usage:
381 # CHECK-NEXT: [1] Resource name.
382 # CHECK-NEXT: [2] Average number of used buffer entries.
383 # CHECK-NEXT: [3] Maximum number of used buffer entries.
384 # CHECK-NEXT: [4] Total number of buffer entries.
386 # CHECK: [1] [2] [3] [4]
387 # CHECK-NEXT: SBPortAny 45 54 54
389 # CHECK: Resources:
390 # CHECK-NEXT: [0] - SBDivider
391 # CHECK-NEXT: [1] - SBFPDivider
392 # CHECK-NEXT: [2] - SBPort0
393 # CHECK-NEXT: [3] - SBPort1
394 # CHECK-NEXT: [4] - SBPort4
395 # CHECK-NEXT: [5] - SBPort5
396 # CHECK-NEXT: [6.0] - SBPort23
397 # CHECK-NEXT: [6.1] - SBPort23
399 # CHECK: Resource pressure per iteration:
400 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
401 # CHECK-NEXT: - - - - 2.00 - 2.00 2.00
403 # CHECK: Resource pressure by instruction:
404 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
405 # CHECK-NEXT: - - - - 1.00 - - 1.00 movq %rsp, (%rax)
406 # CHECK-NEXT: - - - - - - 1.00 - movq (%rcx), %rbp
407 # CHECK-NEXT: - - - - - - 0.95 0.05 movq (%rdx), %rsi
408 # CHECK-NEXT: - - - - 1.00 - 0.05 0.95 movq %rdi, (%rbx)
410 # CHECK: Timeline view:
411 # CHECK-NEXT: Index 0123456789
413 # CHECK: [0,0] DeER . . movq %rsp, (%rax)
414 # CHECK-NEXT: [0,1] DeeeeeER . movq (%rcx), %rbp
415 # CHECK-NEXT: [0,2] D=eeeeeER. movq (%rdx), %rsi
416 # CHECK-NEXT: [0,3] D======eER movq %rdi, (%rbx)
418 # CHECK: Average Wait times (based on the timeline view):
419 # CHECK-NEXT: [0]: Executions
420 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
421 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
422 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
424 # CHECK: [0] [1] [2] [3]
425 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movq %rsp, (%rax)
426 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 movq (%rcx), %rbp
427 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 movq (%rdx), %rsi
428 # CHECK-NEXT: 3. 1 7.0 0.0 0.0 movq %rdi, (%rbx)
430 # CHECK: [4] Code Region
432 # CHECK: Iterations: 100
433 # CHECK-NEXT: Instructions: 400
434 # CHECK-NEXT: Total Cycles: 208
435 # CHECK-NEXT: Total uOps: 400
437 # CHECK: Dispatch Width: 4
438 # CHECK-NEXT: uOps Per Cycle: 1.92
439 # CHECK-NEXT: IPC: 1.92
440 # CHECK-NEXT: Block RThroughput: 2.0
442 # CHECK: Instruction Info:
443 # CHECK-NEXT: [1]: #uOps
444 # CHECK-NEXT: [2]: Latency
445 # CHECK-NEXT: [3]: RThroughput
446 # CHECK-NEXT: [4]: MayLoad
447 # CHECK-NEXT: [5]: MayStore
448 # CHECK-NEXT: [6]: HasSideEffects (U)
450 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
451 # CHECK-NEXT: 1 1 1.00 * U movd %mm0, (%rax)
452 # CHECK-NEXT: 1 5 0.50 * movd (%rcx), %mm1
453 # CHECK-NEXT: 1 5 0.50 * movd (%rdx), %mm2
454 # CHECK-NEXT: 1 1 1.00 * U movd %mm3, (%rbx)
456 # CHECK: Dynamic Dispatch Stall Cycles:
457 # CHECK-NEXT: RAT - Register unavailable: 0
458 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
459 # CHECK-NEXT: SCHEDQ - Scheduler full: 147 (70.7%)
460 # CHECK-NEXT: LQ - Load queue full: 0
461 # CHECK-NEXT: SQ - Store queue full: 0
462 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
464 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
465 # CHECK-NEXT: [# dispatched], [# cycles]
466 # CHECK-NEXT: 0, 34 (16.3%)
467 # CHECK-NEXT: 2, 148 (71.2%)
468 # CHECK-NEXT: 4, 26 (12.5%)
470 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
471 # CHECK-NEXT: [# issued], [# cycles]
472 # CHECK-NEXT: 0, 3 (1.4%)
473 # CHECK-NEXT: 1, 10 (4.8%)
474 # CHECK-NEXT: 2, 195 (93.8%)
476 # CHECK: Scheduler's queue usage:
477 # CHECK-NEXT: [1] Resource name.
478 # CHECK-NEXT: [2] Average number of used buffer entries.
479 # CHECK-NEXT: [3] Maximum number of used buffer entries.
480 # CHECK-NEXT: [4] Total number of buffer entries.
482 # CHECK: [1] [2] [3] [4]
483 # CHECK-NEXT: SBPortAny 45 54 54
485 # CHECK: Resources:
486 # CHECK-NEXT: [0] - SBDivider
487 # CHECK-NEXT: [1] - SBFPDivider
488 # CHECK-NEXT: [2] - SBPort0
489 # CHECK-NEXT: [3] - SBPort1
490 # CHECK-NEXT: [4] - SBPort4
491 # CHECK-NEXT: [5] - SBPort5
492 # CHECK-NEXT: [6.0] - SBPort23
493 # CHECK-NEXT: [6.1] - SBPort23
495 # CHECK: Resource pressure per iteration:
496 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
497 # CHECK-NEXT: - - - - 2.00 - 2.00 2.00
499 # CHECK: Resource pressure by instruction:
500 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
501 # CHECK-NEXT: - - - - 1.00 - - 1.00 movd %mm0, (%rax)
502 # CHECK-NEXT: - - - - - - 1.00 - movd (%rcx), %mm1
503 # CHECK-NEXT: - - - - - - 0.95 0.05 movd (%rdx), %mm2
504 # CHECK-NEXT: - - - - 1.00 - 0.05 0.95 movd %mm3, (%rbx)
506 # CHECK: Timeline view:
507 # CHECK-NEXT: Index 0123456789
509 # CHECK: [0,0] DeER . . movd %mm0, (%rax)
510 # CHECK-NEXT: [0,1] DeeeeeER . movd (%rcx), %mm1
511 # CHECK-NEXT: [0,2] D=eeeeeER. movd (%rdx), %mm2
512 # CHECK-NEXT: [0,3] D======eER movd %mm3, (%rbx)
514 # CHECK: Average Wait times (based on the timeline view):
515 # CHECK-NEXT: [0]: Executions
516 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
517 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
518 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
520 # CHECK: [0] [1] [2] [3]
521 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movd %mm0, (%rax)
522 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 movd (%rcx), %mm1
523 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 movd (%rdx), %mm2
524 # CHECK-NEXT: 3. 1 7.0 0.0 0.0 movd %mm3, (%rbx)
526 # CHECK: [5] Code Region
528 # CHECK: Iterations: 100
529 # CHECK-NEXT: Instructions: 400
530 # CHECK-NEXT: Total Cycles: 209
531 # CHECK-NEXT: Total uOps: 400
533 # CHECK: Dispatch Width: 4
534 # CHECK-NEXT: uOps Per Cycle: 1.91
535 # CHECK-NEXT: IPC: 1.91
536 # CHECK-NEXT: Block RThroughput: 2.0
538 # CHECK: Instruction Info:
539 # CHECK-NEXT: [1]: #uOps
540 # CHECK-NEXT: [2]: Latency
541 # CHECK-NEXT: [3]: RThroughput
542 # CHECK-NEXT: [4]: MayLoad
543 # CHECK-NEXT: [5]: MayStore
544 # CHECK-NEXT: [6]: HasSideEffects (U)
546 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
547 # CHECK-NEXT: 1 1 1.00 * movaps %xmm0, (%rax)
548 # CHECK-NEXT: 1 6 0.50 * movaps (%rcx), %xmm1
549 # CHECK-NEXT: 1 6 0.50 * movaps (%rdx), %xmm2
550 # CHECK-NEXT: 1 1 1.00 * movaps %xmm3, (%rbx)
552 # CHECK: Dynamic Dispatch Stall Cycles:
553 # CHECK-NEXT: RAT - Register unavailable: 0
554 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
555 # CHECK-NEXT: SCHEDQ - Scheduler full: 147 (70.3%)
556 # CHECK-NEXT: LQ - Load queue full: 0
557 # CHECK-NEXT: SQ - Store queue full: 0
558 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
560 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
561 # CHECK-NEXT: [# dispatched], [# cycles]
562 # CHECK-NEXT: 0, 35 (16.7%)
563 # CHECK-NEXT: 2, 148 (70.8%)
564 # CHECK-NEXT: 4, 26 (12.4%)
566 # CHECK: Schedulers - number of cycles where we saw N micro opcodes issued:
567 # CHECK-NEXT: [# issued], [# cycles]
568 # CHECK-NEXT: 0, 3 (1.4%)
569 # CHECK-NEXT: 1, 12 (5.7%)
570 # CHECK-NEXT: 2, 194 (92.8%)
572 # CHECK: Scheduler's queue usage:
573 # CHECK-NEXT: [1] Resource name.
574 # CHECK-NEXT: [2] Average number of used buffer entries.
575 # CHECK-NEXT: [3] Maximum number of used buffer entries.
576 # CHECK-NEXT: [4] Total number of buffer entries.
578 # CHECK: [1] [2] [3] [4]
579 # CHECK-NEXT: SBPortAny 45 54 54
581 # CHECK: Resources:
582 # CHECK-NEXT: [0] - SBDivider
583 # CHECK-NEXT: [1] - SBFPDivider
584 # CHECK-NEXT: [2] - SBPort0
585 # CHECK-NEXT: [3] - SBPort1
586 # CHECK-NEXT: [4] - SBPort4
587 # CHECK-NEXT: [5] - SBPort5
588 # CHECK-NEXT: [6.0] - SBPort23
589 # CHECK-NEXT: [6.1] - SBPort23
591 # CHECK: Resource pressure per iteration:
592 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1]
593 # CHECK-NEXT: - - - - 2.00 - 2.00 2.00
595 # CHECK: Resource pressure by instruction:
596 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
597 # CHECK-NEXT: - - - - 1.00 - - 1.00 movaps %xmm0, (%rax)
598 # CHECK-NEXT: - - - - - - 1.00 - movaps (%rcx), %xmm1
599 # CHECK-NEXT: - - - - - - 0.94 0.06 movaps (%rdx), %xmm2
600 # CHECK-NEXT: - - - - 1.00 - 0.06 0.94 movaps %xmm3, (%rbx)
602 # CHECK: Timeline view:
603 # CHECK-NEXT: 0
604 # CHECK-NEXT: Index 0123456789
606 # CHECK: [0,0] DeER . . movaps %xmm0, (%rax)
607 # CHECK-NEXT: [0,1] DeeeeeeER . movaps (%rcx), %xmm1
608 # CHECK-NEXT: [0,2] D=eeeeeeER. movaps (%rdx), %xmm2
609 # CHECK-NEXT: [0,3] D=======eER movaps %xmm3, (%rbx)
611 # CHECK: Average Wait times (based on the timeline view):
612 # CHECK-NEXT: [0]: Executions
613 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
614 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
615 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
617 # CHECK: [0] [1] [2] [3]
618 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 movaps %xmm0, (%rax)
619 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 movaps (%rcx), %xmm1
620 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 movaps (%rdx), %xmm2
621 # CHECK-NEXT: 3. 1 8.0 0.0 0.0 movaps %xmm3, (%rbx)