1 # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2 # RUN: llvm-mca -mtriple=aarch64 -mcpu=cortex-a57 --instruction-info=0 --resource-pressure=0 --timeline --timeline-max-iterations=1 < %s | FileCheck %s
# ld1, one-register list, base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (8 or 16).
ld1     { v1.1d }, [x27], #8
ld1     { v1.2d }, [x27], #16
ld1     { v1.2s }, [x27], #8
ld1     { v1.4h }, [x27], #8
ld1     { v1.4s }, [x27], #16
ld1     { v1.8b }, [x27], #8
ld1     { v1.8h }, [x27], #16
ld1     { v1.16b }, [x27], #16
# Register form: the same arrangements, post-indexed by x28.
ld1     { v1.1d }, [x27], x28
ld1     { v1.2d }, [x27], x28
ld1     { v1.2s }, [x27], x28
ld1     { v1.4h }, [x27], x28
ld1     { v1.4s }, [x27], x28
ld1     { v1.8b }, [x27], x28
ld1     { v1.8h }, [x27], x28
ld1     { v1.16b }, [x27], x28
# ld1, two-register list (v1, v2), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (16 or 32).
ld1     { v1.1d, v2.1d }, [x27], #16
ld1     { v1.2d, v2.2d }, [x27], #32
ld1     { v1.2s, v2.2s }, [x27], #16
ld1     { v1.4h, v2.4h }, [x27], #16
ld1     { v1.4s, v2.4s }, [x27], #32
ld1     { v1.8b, v2.8b }, [x27], #16
ld1     { v1.8h, v2.8h }, [x27], #32
ld1     { v1.16b, v2.16b }, [x27], #32
# Register form: the same arrangements, post-indexed by x28.
ld1     { v1.1d, v2.1d }, [x27], x28
ld1     { v1.2d, v2.2d }, [x27], x28
ld1     { v1.2s, v2.2s }, [x27], x28
ld1     { v1.4h, v2.4h }, [x27], x28
ld1     { v1.4s, v2.4s }, [x27], x28
ld1     { v1.8b, v2.8b }, [x27], x28
ld1     { v1.8h, v2.8h }, [x27], x28
ld1     { v1.16b, v2.16b }, [x27], x28
# ld1, three-register list (v1-v3), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (24 or 48).
ld1     { v1.1d, v2.1d, v3.1d }, [x27], #24
ld1     { v1.2d, v2.2d, v3.2d }, [x27], #48
ld1     { v1.2s, v2.2s, v3.2s }, [x27], #24
ld1     { v1.4h, v2.4h, v3.4h }, [x27], #24
ld1     { v1.4s, v2.4s, v3.4s }, [x27], #48
ld1     { v1.8b, v2.8b, v3.8b }, [x27], #24
ld1     { v1.8h, v2.8h, v3.8h }, [x27], #48
ld1     { v1.16b, v2.16b, v3.16b }, [x27], #48
# Register form: the same arrangements, post-indexed by x28.
ld1     { v1.1d, v2.1d, v3.1d }, [x27], x28
ld1     { v1.2d, v2.2d, v3.2d }, [x27], x28
ld1     { v1.2s, v2.2s, v3.2s }, [x27], x28
ld1     { v1.4h, v2.4h, v3.4h }, [x27], x28
ld1     { v1.4s, v2.4s, v3.4s }, [x27], x28
ld1     { v1.8b, v2.8b, v3.8b }, [x27], x28
ld1     { v1.8h, v2.8h, v3.8h }, [x27], x28
ld1     { v1.16b, v2.16b, v3.16b }, [x27], x28
# ld1, four-register list (v1-v4), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (32 or 64).
ld1     { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
ld1     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
ld1     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
ld1     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
ld1     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
ld1     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
ld1     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
ld1     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
# Register form: the same arrangements, post-indexed by x28.
ld1     { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
ld1     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
ld1     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
ld1     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
ld1     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
ld1     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
ld1     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
ld1     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
# ld1, single-lane form into v1, base x27 with post-index writeback.
# Each element size is exercised with an immediate offset (the element
# size in bytes) and with the register offset x28.
ld1     { v1.b }[0], [x27], #1
ld1     { v1.b }[8], [x27], #1
ld1     { v1.b }[0], [x27], x28
ld1     { v1.b }[8], [x27], x28
ld1     { v1.h }[0], [x27], #2
ld1     { v1.h }[4], [x27], #2
ld1     { v1.h }[0], [x27], x28
ld1     { v1.h }[4], [x27], x28
ld1     { v1.s }[0], [x27], #4
ld1     { v1.s }[0], [x27], x28
ld1     { v1.d }[0], [x27], #8
ld1     { v1.d }[0], [x27], x28
# ld1r (load one element and replicate), base x27 with post-index writeback.
# Immediate form: the offset is the size of the single element loaded.
ld1r    { v1.1d }, [x27], #8
ld1r    { v1.2d }, [x27], #8
ld1r    { v1.2s }, [x27], #4
ld1r    { v1.4h }, [x27], #2
ld1r    { v1.4s }, [x27], #4
ld1r    { v1.8b }, [x27], #1
ld1r    { v1.8h }, [x27], #2
ld1r    { v1.16b }, [x27], #1
# Register form: the same arrangements, post-indexed by x28.
ld1r    { v1.1d }, [x27], x28
ld1r    { v1.2d }, [x27], x28
ld1r    { v1.2s }, [x27], x28
ld1r    { v1.4h }, [x27], x28
ld1r    { v1.4s }, [x27], x28
ld1r    { v1.8b }, [x27], x28
ld1r    { v1.8h }, [x27], x28
ld1r    { v1.16b }, [x27], x28
# ld2, multiple-structure form (v1, v2), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (16 or 32).
ld2     { v1.2d, v2.2d }, [x27], #32
ld2     { v1.2s, v2.2s }, [x27], #16
ld2     { v1.4h, v2.4h }, [x27], #16
ld2     { v1.4s, v2.4s }, [x27], #32
ld2     { v1.8b, v2.8b }, [x27], #16
ld2     { v1.8h, v2.8h }, [x27], #32
ld2     { v1.16b, v2.16b }, [x27], #32
# Register form: the same arrangements, post-indexed by x28.
ld2     { v1.2d, v2.2d }, [x27], x28
ld2     { v1.2s, v2.2s }, [x27], x28
ld2     { v1.4h, v2.4h }, [x27], x28
ld2     { v1.4s, v2.4s }, [x27], x28
ld2     { v1.8b, v2.8b }, [x27], x28
ld2     { v1.8h, v2.8h }, [x27], x28
ld2     { v1.16b, v2.16b }, [x27], x28
# ld2, single-lane form into v1/v2, base x27 with post-index writeback.
# Immediate offsets are twice the element size; register offsets use x28.
ld2     { v1.b, v2.b }[0], [x27], #2
ld2     { v1.b, v2.b }[8], [x27], #2
ld2     { v1.b, v2.b }[0], [x27], x28
ld2     { v1.b, v2.b }[8], [x27], x28
ld2     { v1.h, v2.h }[0], [x27], #4
ld2     { v1.h, v2.h }[4], [x27], #4
ld2     { v1.h, v2.h }[0], [x27], x28
ld2     { v1.h, v2.h }[4], [x27], x28
ld2     { v1.s, v2.s }[0], [x27], #8
ld2     { v1.s, v2.s }[0], [x27], x28
ld2     { v1.d, v2.d }[0], [x27], #16
ld2     { v1.d, v2.d }[0], [x27], x28
# ld2r (load two elements and replicate), base x27 with post-index writeback.
# Immediate form: the offset is twice the element size.
ld2r    { v1.1d, v2.1d }, [x27], #16
ld2r    { v1.2d, v2.2d }, [x27], #16
ld2r    { v1.2s, v2.2s }, [x27], #8
ld2r    { v1.4h, v2.4h }, [x27], #4
ld2r    { v1.4s, v2.4s }, [x27], #8
ld2r    { v1.8b, v2.8b }, [x27], #2
ld2r    { v1.8h, v2.8h }, [x27], #4
ld2r    { v1.16b, v2.16b }, [x27], #2
# Register form: the same arrangements, post-indexed by x28.
ld2r    { v1.1d, v2.1d }, [x27], x28
ld2r    { v1.2d, v2.2d }, [x27], x28
ld2r    { v1.2s, v2.2s }, [x27], x28
ld2r    { v1.4h, v2.4h }, [x27], x28
ld2r    { v1.4s, v2.4s }, [x27], x28
ld2r    { v1.8b, v2.8b }, [x27], x28
ld2r    { v1.8h, v2.8h }, [x27], x28
ld2r    { v1.16b, v2.16b }, [x27], x28
# ld3, multiple-structure form (v1-v3), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (24 or 48).
ld3     { v1.2d, v2.2d, v3.2d }, [x27], #48
ld3     { v1.2s, v2.2s, v3.2s }, [x27], #24
ld3     { v1.4h, v2.4h, v3.4h }, [x27], #24
ld3     { v1.4s, v2.4s, v3.4s }, [x27], #48
ld3     { v1.8b, v2.8b, v3.8b }, [x27], #24
ld3     { v1.8h, v2.8h, v3.8h }, [x27], #48
ld3     { v1.16b, v2.16b, v3.16b }, [x27], #48
# Register form: the same arrangements, post-indexed by x28.
ld3     { v1.2d, v2.2d, v3.2d }, [x27], x28
ld3     { v1.2s, v2.2s, v3.2s }, [x27], x28
ld3     { v1.4h, v2.4h, v3.4h }, [x27], x28
ld3     { v1.4s, v2.4s, v3.4s }, [x27], x28
ld3     { v1.8b, v2.8b, v3.8b }, [x27], x28
ld3     { v1.8h, v2.8h, v3.8h }, [x27], x28
ld3     { v1.16b, v2.16b, v3.16b }, [x27], x28
# ld3, single-lane form into v1-v3, base x27 with post-index writeback.
# Immediate offsets are three times the element size; register offsets use x28.
ld3     { v1.b, v2.b, v3.b }[0], [x27], #3
ld3     { v1.b, v2.b, v3.b }[8], [x27], #3
ld3     { v1.b, v2.b, v3.b }[0], [x27], x28
ld3     { v1.b, v2.b, v3.b }[8], [x27], x28
ld3     { v1.h, v2.h, v3.h }[0], [x27], #6
ld3     { v1.h, v2.h, v3.h }[4], [x27], #6
ld3     { v1.h, v2.h, v3.h }[0], [x27], x28
ld3     { v1.h, v2.h, v3.h }[4], [x27], x28
ld3     { v1.s, v2.s, v3.s }[0], [x27], #12
ld3     { v1.s, v2.s, v3.s }[0], [x27], x28
ld3     { v1.d, v2.d, v3.d }[0], [x27], #24
ld3     { v1.d, v2.d, v3.d }[0], [x27], x28
# ld3r (load three elements and replicate), base x27 with post-index writeback.
# Immediate form: the offset is three times the element size.
ld3r    { v1.1d, v2.1d, v3.1d }, [x27], #24
ld3r    { v1.2d, v2.2d, v3.2d }, [x27], #24
ld3r    { v1.2s, v2.2s, v3.2s }, [x27], #12
ld3r    { v1.4h, v2.4h, v3.4h }, [x27], #6
ld3r    { v1.4s, v2.4s, v3.4s }, [x27], #12
ld3r    { v1.8b, v2.8b, v3.8b }, [x27], #3
ld3r    { v1.8h, v2.8h, v3.8h }, [x27], #6
ld3r    { v1.16b, v2.16b, v3.16b }, [x27], #3
# Register form: the same arrangements, post-indexed by x28.
ld3r    { v1.1d, v2.1d, v3.1d }, [x27], x28
ld3r    { v1.2d, v2.2d, v3.2d }, [x27], x28
ld3r    { v1.2s, v2.2s, v3.2s }, [x27], x28
ld3r    { v1.4h, v2.4h, v3.4h }, [x27], x28
ld3r    { v1.4s, v2.4s, v3.4s }, [x27], x28
ld3r    { v1.8b, v2.8b, v3.8b }, [x27], x28
ld3r    { v1.8h, v2.8h, v3.8h }, [x27], x28
ld3r    { v1.16b, v2.16b, v3.16b }, [x27], x28
# ld4, multiple-structure form (v1-v4), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes transferred (32 or 64).
ld4     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
ld4     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
ld4     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
ld4     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
ld4     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
ld4     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
ld4     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
# Register form: the same arrangements, post-indexed by x28.
ld4     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
ld4     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
ld4     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
ld4     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
ld4     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
ld4     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
ld4     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
# ld4, single-lane form into v1-v4, base x27 with post-index writeback.
# Immediate offsets are four times the element size; register offsets use x28.
ld4     { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
ld4     { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
ld4     { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
ld4     { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
ld4     { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
ld4     { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
ld4     { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
ld4     { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
ld4     { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
ld4     { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
ld4     { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
ld4     { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
# ld4r (load four elements and replicate), base x27 with post-index writeback.
# Immediate form: the offset is four times the element size.
ld4r    { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
ld4r    { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
ld4r    { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
ld4r    { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
ld4r    { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
ld4r    { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
ld4r    { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
ld4r    { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
# Register form: the same arrangements, post-indexed by x28.
ld4r    { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
ld4r    { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
ld4r    { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
ld4r    { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
ld4r    { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
ld4r    { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
ld4r    { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
ld4r    { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
# ldp / ldpsw with writeback to base x27.
# FP/SIMD register pairs: post-index, then pre-index.
ldp     s1, s2, [x27], #248
ldp     d1, d2, [x27], #496
ldp     q1, q2, [x27], #992
ldp     s1, s2, [x27, #248]!
ldp     d1, d2, [x27, #496]!
ldp     q1, q2, [x27, #992]!
# General-purpose register pairs: post-index, then pre-index.
ldp     w1, w2, [x27], #248
ldp     x1, x2, [x27], #496
ldp     w1, w2, [x27, #248]!
ldp     x1, x2, [x27, #496]!
# Sign-extending word pair: post-index, then pre-index.
ldpsw   x1, x2, [x27], #248
ldpsw   x1, x2, [x27, #248]!
# Byte/halfword/word loads with writeback to base x27 (offset #254).
# Zero-extending forms visible here are pre-index only.
ldrb    w1, [x27, #254]!
ldrh    w1, [x27, #254]!
# Sign-extending byte loads: post-index, then pre-index, for w and x targets.
ldrsb   w1, [x27], #254
ldrsb   x1, [x27], #254
ldrsb   w1, [x27, #254]!
ldrsb   x1, [x27, #254]!
# Sign-extending halfword loads: post-index, then pre-index.
ldrsh   w1, [x27], #254
ldrsh   x1, [x27], #254
ldrsh   w1, [x27, #254]!
ldrsh   x1, [x27, #254]!
# Sign-extending word load: post-index, then pre-index.
ldrsw   x1, [x27], #254
ldrsw   x1, [x27, #254]!
# st1, one-register list, base x27 with post-index writeback.
# Immediate form: the offset equals the bytes stored (8 or 16).
st1     { v1.1d }, [x27], #8
st1     { v1.2d }, [x27], #16
st1     { v1.2s }, [x27], #8
st1     { v1.4h }, [x27], #8
st1     { v1.4s }, [x27], #16
st1     { v1.8b }, [x27], #8
st1     { v1.8h }, [x27], #16
st1     { v1.16b }, [x27], #16
# Register form: the same arrangements, post-indexed by x28.
st1     { v1.1d }, [x27], x28
st1     { v1.2d }, [x27], x28
st1     { v1.2s }, [x27], x28
st1     { v1.4h }, [x27], x28
st1     { v1.4s }, [x27], x28
st1     { v1.8b }, [x27], x28
st1     { v1.8h }, [x27], x28
st1     { v1.16b }, [x27], x28
# st1, two-register list (v1, v2), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes stored (16 or 32).
st1     { v1.1d, v2.1d }, [x27], #16
st1     { v1.2d, v2.2d }, [x27], #32
st1     { v1.2s, v2.2s }, [x27], #16
st1     { v1.4h, v2.4h }, [x27], #16
st1     { v1.4s, v2.4s }, [x27], #32
st1     { v1.8b, v2.8b }, [x27], #16
st1     { v1.8h, v2.8h }, [x27], #32
st1     { v1.16b, v2.16b }, [x27], #32
# Register form: the same arrangements, post-indexed by x28.
st1     { v1.1d, v2.1d }, [x27], x28
st1     { v1.2d, v2.2d }, [x27], x28
st1     { v1.2s, v2.2s }, [x27], x28
st1     { v1.4h, v2.4h }, [x27], x28
st1     { v1.4s, v2.4s }, [x27], x28
st1     { v1.8b, v2.8b }, [x27], x28
st1     { v1.8h, v2.8h }, [x27], x28
st1     { v1.16b, v2.16b }, [x27], x28
# st1, three-register list (v1-v3), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes stored (24 or 48).
st1     { v1.1d, v2.1d, v3.1d }, [x27], #24
st1     { v1.2d, v2.2d, v3.2d }, [x27], #48
st1     { v1.2s, v2.2s, v3.2s }, [x27], #24
st1     { v1.4h, v2.4h, v3.4h }, [x27], #24
st1     { v1.4s, v2.4s, v3.4s }, [x27], #48
st1     { v1.8b, v2.8b, v3.8b }, [x27], #24
st1     { v1.8h, v2.8h, v3.8h }, [x27], #48
st1     { v1.16b, v2.16b, v3.16b }, [x27], #48
# Register form: the same arrangements, post-indexed by x28.
st1     { v1.1d, v2.1d, v3.1d }, [x27], x28
st1     { v1.2d, v2.2d, v3.2d }, [x27], x28
st1     { v1.2s, v2.2s, v3.2s }, [x27], x28
st1     { v1.4h, v2.4h, v3.4h }, [x27], x28
st1     { v1.4s, v2.4s, v3.4s }, [x27], x28
st1     { v1.8b, v2.8b, v3.8b }, [x27], x28
st1     { v1.8h, v2.8h, v3.8h }, [x27], x28
st1     { v1.16b, v2.16b, v3.16b }, [x27], x28
# st1, four-register list (v1-v4), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes stored (32 or 64).
st1     { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
st1     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
st1     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
st1     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
st1     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
st1     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
st1     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
st1     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
# Register form: the same arrangements, post-indexed by x28.
st1     { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
st1     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
st1     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
st1     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
st1     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
st1     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
st1     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
st1     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
# st1, single-lane form from v1, base x27 with post-index writeback.
# Each element size is exercised with an immediate offset (the element
# size in bytes) and with the register offset x28.
st1     { v1.b }[0], [x27], #1
st1     { v1.b }[8], [x27], #1
st1     { v1.b }[0], [x27], x28
st1     { v1.b }[8], [x27], x28
st1     { v1.h }[0], [x27], #2
st1     { v1.h }[4], [x27], #2
st1     { v1.h }[0], [x27], x28
st1     { v1.h }[4], [x27], x28
st1     { v1.s }[0], [x27], #4
st1     { v1.s }[0], [x27], x28
st1     { v1.d }[0], [x27], #8
st1     { v1.d }[0], [x27], x28
# st2, multiple-structure form (v1, v2), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes stored (16 or 32).
st2     { v1.2d, v2.2d }, [x27], #32
st2     { v1.2s, v2.2s }, [x27], #16
st2     { v1.4h, v2.4h }, [x27], #16
st2     { v1.4s, v2.4s }, [x27], #32
st2     { v1.8b, v2.8b }, [x27], #16
st2     { v1.8h, v2.8h }, [x27], #32
st2     { v1.16b, v2.16b }, [x27], #32
# Register form: the same arrangements, post-indexed by x28.
st2     { v1.2d, v2.2d }, [x27], x28
st2     { v1.2s, v2.2s }, [x27], x28
st2     { v1.4h, v2.4h }, [x27], x28
st2     { v1.4s, v2.4s }, [x27], x28
st2     { v1.8b, v2.8b }, [x27], x28
st2     { v1.8h, v2.8h }, [x27], x28
st2     { v1.16b, v2.16b }, [x27], x28
# st2, single-lane form from v1/v2, base x27 with post-index writeback.
# Immediate offsets are twice the element size; register offsets use x28.
st2     { v1.b, v2.b }[0], [x27], #2
st2     { v1.b, v2.b }[8], [x27], #2
st2     { v1.b, v2.b }[0], [x27], x28
st2     { v1.b, v2.b }[8], [x27], x28
st2     { v1.h, v2.h }[0], [x27], #4
st2     { v1.h, v2.h }[4], [x27], #4
st2     { v1.h, v2.h }[0], [x27], x28
st2     { v1.h, v2.h }[4], [x27], x28
st2     { v1.s, v2.s }[0], [x27], #8
st2     { v1.s, v2.s }[0], [x27], x28
st2     { v1.d, v2.d }[0], [x27], #16
st2     { v1.d, v2.d }[0], [x27], x28
# st3, multiple-structure form (v1-v3), base x27 with post-index writeback.
# Immediate form: the offset equals the bytes stored (24 or 48).
st3     { v1.2d, v2.2d, v3.2d }, [x27], #48
st3     { v1.2s, v2.2s, v3.2s }, [x27], #24
st3     { v1.4h, v2.4h, v3.4h }, [x27], #24
st3     { v1.4s, v2.4s, v3.4s }, [x27], #48
st3     { v1.8b, v2.8b, v3.8b }, [x27], #24
st3     { v1.8h, v2.8h, v3.8h }, [x27], #48
st3     { v1.16b, v2.16b, v3.16b }, [x27], #48
# Register form: the same arrangements, post-indexed by x28.
st3     { v1.2d, v2.2d, v3.2d }, [x27], x28
st3     { v1.2s, v2.2s, v3.2s }, [x27], x28
st3     { v1.4h, v2.4h, v3.4h }, [x27], x28
st3     { v1.4s, v2.4s, v3.4s }, [x27], x28
st3     { v1.8b, v2.8b, v3.8b }, [x27], x28
st3     { v1.8h, v2.8h, v3.8h }, [x27], x28
st3     { v1.16b, v2.16b, v3.16b }, [x27], x28
# st3, single-lane form from v1-v3, base x27 with post-index writeback.
# Immediate offsets are three times the element size; register offsets use x28.
# The region marker below is kept exactly where it appears in the input.
st3     { v1.b, v2.b, v3.b }[0], [x27], #3
st3     { v1.b, v2.b, v3.b }[8], [x27], #3
st3     { v1.b, v2.b, v3.b }[0], [x27], x28
st3     { v1.b, v2.b, v3.b }[8], [x27], x28
st3     { v1.h, v2.h, v3.h }[0], [x27], #6
st3     { v1.h, v2.h, v3.h }[4], [x27], #6
st3     { v1.h, v2.h, v3.h }[0], [x27], x28
st3     { v1.h, v2.h, v3.h }[4], [x27], x28
st3     { v1.s, v2.s, v3.s }[0], [x27], #12
# LLVM-MCA-BEGIN G78
st3     { v1.s, v2.s, v3.s }[0], [x27], x28
st3     { v1.d, v2.d, v3.d }[0], [x27], #24
st3     { v1.d, v2.d, v3.d }[0], [x27], x28
# st4, multiple-structure form (v1-v4), base x27 with post-index writeback.
# Immediate form first (offset equals the bytes stored, 32 or 64), then the
# same arrangements post-indexed by x28. Region markers stay in place.
st4     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
st4     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
# LLVM-MCA-BEGIN G79
st4     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
st4     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
st4     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
st4     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
st4     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
# LLVM-MCA-BEGIN G80
st4     { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
st4     { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
st4     { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
st4     { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
st4     { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
# LLVM-MCA-BEGIN G81
st4     { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
st4     { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
# st4, single-lane form from v1-v4, base x27 with post-index writeback.
# Immediate offsets are four times the element size; register offsets use x28.
# Region markers stay exactly where they appear in the input.
st4     { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
st4     { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
st4     { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
# LLVM-MCA-BEGIN G82
st4     { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
st4     { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
st4     { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
st4     { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
st4     { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
# LLVM-MCA-BEGIN G83
st4     { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
st4     { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
st4     { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
st4     { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
# LLVM-MCA-BEGIN G84
# stp with writeback to base x27: FP/SIMD pairs post-index then pre-index,
# followed by general-purpose pairs post-index then pre-index.
stp     s1, s2, [x27], #248
stp     d1, d2, [x27], #496
# LLVM-MCA-BEGIN G85
stp     q1, q2, [x27], #992
stp     s1, s2, [x27, #248]!
stp     d1, d2, [x27, #496]!
stp     q1, q2, [x27, #992]!
stp     w1, w2, [x27], #248
# LLVM-MCA-BEGIN G86
stp     x1, x2, [x27], #496
stp     w1, w2, [x27, #248]!
stp     x1, x2, [x27, #496]!
# LLVM-MCA-BEGIN G87
# str / strb / strh with writeback to base x27 (offset #254).
# FP/SIMD and general-purpose str forms visible here are pre-index;
# strb and strh appear in both post-index and pre-index form.
str     b1, [x27, #254]!
str     h1, [x27, #254]!
# LLVM-MCA-BEGIN G88
str     s1, [x27, #254]!
str     d1, [x27, #254]!
str     q1, [x27, #254]!
# LLVM-MCA-BEGIN G89
str     w1, [x27, #254]!
str     x1, [x27, #254]!
strb    w1, [x27], #254
strb    w1, [x27, #254]!
strh    w1, [x27], #254
# LLVM-MCA-BEGIN G90
strh    w1, [x27, #254]!
# LLVM-MCA-BEGIN G91
1161 # CHECK: [0] Code Region - G01
1163 # CHECK: Iterations: 100
1164 # CHECK-NEXT: Instructions: 1000
1165 # CHECK-NEXT: Total Cycles: 507
1166 # CHECK-NEXT: Total uOps: 1500
1168 # CHECK: Dispatch Width: 3
1169 # CHECK-NEXT: uOps Per Cycle: 2.96
1170 # CHECK-NEXT: IPC: 1.97
1171 # CHECK-NEXT: Block RThroughput: 5.0
1173 # CHECK: Timeline view:
1175 # CHECK-NEXT: Index 0123456789
1177 # CHECK: [0,0] DeeeeeER .. ld1 { v1.1d }, [x27], #8
1178 # CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1
1179 # CHECK-NEXT: [0,2] .DeeeeeER .. ld1 { v1.2d }, [x27], #16
1180 # CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1
1181 # CHECK-NEXT: [0,4] . DeeeeeER.. ld1 { v1.2s }, [x27], #8
1182 # CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1
1183 # CHECK-NEXT: [0,6] . DeeeeeER. ld1 { v1.4h }, [x27], #8
1184 # CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1
1185 # CHECK-NEXT: [0,8] . DeeeeeER ld1 { v1.4s }, [x27], #16
1186 # CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1
1188 # CHECK: Average Wait times (based on the timeline view):
1189 # CHECK-NEXT: [0]: Executions
1190 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1191 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1192 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1194 # CHECK: [0] [1] [2] [3]
1195 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.1d }, [x27], #8
1196 # CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1
1197 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.2d }, [x27], #16
1198 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1199 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.2s }, [x27], #8
1200 # CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1
1201 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.4h }, [x27], #8
1202 # CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1
1203 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld1 { v1.4s }, [x27], #16
1204 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
1205 # CHECK-NEXT: 1 1.5 0.1 1.5 <total>
1207 # CHECK: [1] Code Region - G02
1209 # CHECK: Iterations: 100
1210 # CHECK-NEXT: Instructions: 1000
1211 # CHECK-NEXT: Total Cycles: 507
1212 # CHECK-NEXT: Total uOps: 1500
1214 # CHECK: Dispatch Width: 3
1215 # CHECK-NEXT: uOps Per Cycle: 2.96
1216 # CHECK-NEXT: IPC: 1.97
1217 # CHECK-NEXT: Block RThroughput: 5.0
1219 # CHECK: Timeline view:
1221 # CHECK-NEXT: Index 0123456789
1223 # CHECK: [0,0] DeeeeeER .. ld1 { v1.8b }, [x27], #8
1224 # CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1
1225 # CHECK-NEXT: [0,2] .DeeeeeER .. ld1 { v1.8h }, [x27], #16
1226 # CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1
1227 # CHECK-NEXT: [0,4] . DeeeeeER.. ld1 { v1.16b }, [x27], #16
1228 # CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1
1229 # CHECK-NEXT: [0,6] . DeeeeeER. ld1 { v1.1d }, [x27], x28
1230 # CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1
1231 # CHECK-NEXT: [0,8] . DeeeeeER ld1 { v1.2d }, [x27], x28
1232 # CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1
1234 # CHECK: Average Wait times (based on the timeline view):
1235 # CHECK-NEXT: [0]: Executions
1236 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1237 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1238 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1240 # CHECK: [0] [1] [2] [3]
1241 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8b }, [x27], #8
1242 # CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1
1243 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.8h }, [x27], #16
1244 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1245 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.16b }, [x27], #16
1246 # CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1
1247 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.1d }, [x27], x28
1248 # CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1
1249 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld1 { v1.2d }, [x27], x28
1250 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
1251 # CHECK-NEXT: 1 1.5 0.1 1.5 <total>
1253 # CHECK: [2] Code Region - G03
1255 # CHECK: Iterations: 100
1256 # CHECK-NEXT: Instructions: 1000
1257 # CHECK-NEXT: Total Cycles: 507
1258 # CHECK-NEXT: Total uOps: 1500
1260 # CHECK: Dispatch Width: 3
1261 # CHECK-NEXT: uOps Per Cycle: 2.96
1262 # CHECK-NEXT: IPC: 1.97
1263 # CHECK-NEXT: Block RThroughput: 5.0
1265 # CHECK: Timeline view:
1267 # CHECK-NEXT: Index 0123456789
1269 # CHECK: [0,0] DeeeeeER .. ld1 { v1.2s }, [x27], x28
1270 # CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1
1271 # CHECK-NEXT: [0,2] .DeeeeeER .. ld1 { v1.4h }, [x27], x28
1272 # CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1
1273 # CHECK-NEXT: [0,4] . DeeeeeER.. ld1 { v1.4s }, [x27], x28
1274 # CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1
1275 # CHECK-NEXT: [0,6] . DeeeeeER. ld1 { v1.8b }, [x27], x28
1276 # CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1
1277 # CHECK-NEXT: [0,8] . DeeeeeER ld1 { v1.8h }, [x27], x28
1278 # CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1
1280 # CHECK: Average Wait times (based on the timeline view):
1281 # CHECK-NEXT: [0]: Executions
1282 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1283 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1284 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1286 # CHECK: [0] [1] [2] [3]
1287 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2s }, [x27], x28
1288 # CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1
1289 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.4h }, [x27], x28
1290 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1291 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.4s }, [x27], x28
1292 # CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1
1293 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.8b }, [x27], x28
1294 # CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1
1295 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld1 { v1.8h }, [x27], x28
1296 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
1297 # CHECK-NEXT: 1 1.5 0.1 1.5 <total>
1299 # CHECK: [3] Code Region - G04
1301 # CHECK: Iterations: 100
1302 # CHECK-NEXT: Instructions: 1000
1303 # CHECK-NEXT: Total Cycles: 607
1304 # CHECK-NEXT: Total uOps: 1600
1306 # CHECK: Dispatch Width: 3
1307 # CHECK-NEXT: uOps Per Cycle: 2.64
1308 # CHECK-NEXT: IPC: 1.65
1309 # CHECK-NEXT: Block RThroughput: 6.0
1311 # CHECK: Timeline view:
1313 # CHECK-NEXT: Index 0123456789
1315 # CHECK: [0,0] DeeeeeER . . ld1 { v1.16b }, [x27], x28
1316 # CHECK-NEXT: [0,1] D=eE---R . . add x0, x27, #1
1317 # CHECK-NEXT: [0,2] .DeeeeeER . . ld1 { v1.1d, v2.1d }, [x27], #16
1318 # CHECK-NEXT: [0,3] .D=eE---R . . add x0, x27, #1
1319 # CHECK-NEXT: [0,4] . DeeeeeeER . ld1 { v1.2d, v2.2d }, [x27], #32
1320 # CHECK-NEXT: [0,5] . DeE----R . add x0, x27, #1
1321 # CHECK-NEXT: [0,6] . D=eeeeeER. ld1 { v1.2s, v2.2s }, [x27], #16
1322 # CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1
1323 # CHECK-NEXT: [0,8] . D=eeeeeER ld1 { v1.4h, v2.4h }, [x27], #16
1324 # CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1
1326 # CHECK: Average Wait times (based on the timeline view):
1327 # CHECK-NEXT: [0]: Executions
1328 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1329 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1330 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1332 # CHECK: [0] [1] [2] [3]
1333 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.16b }, [x27], x28
1334 # CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1
1335 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.1d, v2.1d }, [x27], #16
1336 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1337 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.2d, v2.2d }, [x27], #32
1338 # CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1
1339 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 ld1 { v1.2s, v2.2s }, [x27], #16
1340 # CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1
1341 # CHECK-NEXT: 8. 1 2.0 0.0 0.0 ld1 { v1.4h, v2.4h }, [x27], #16
1342 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
1343 # CHECK-NEXT: 1 1.6 0.2 1.6 <total>
1345 # CHECK: [4] Code Region - G05
1347 # CHECK: Iterations: 100
1348 # CHECK-NEXT: Instructions: 1000
1349 # CHECK-NEXT: Total Cycles: 807
1350 # CHECK-NEXT: Total uOps: 1800
1352 # CHECK: Dispatch Width: 3
1353 # CHECK-NEXT: uOps Per Cycle: 2.23
1354 # CHECK-NEXT: IPC: 1.24
1355 # CHECK-NEXT: Block RThroughput: 8.0
1357 # CHECK: Timeline view:
1359 # CHECK-NEXT: Index 0123456789
1361 # CHECK: [0,0] DeeeeeeER . . ld1 { v1.4s, v2.4s }, [x27], #32
1362 # CHECK-NEXT: [0,1] .DeE----R . . add x0, x27, #1
1363 # CHECK-NEXT: [0,2] .D=eeeeeER. . ld1 { v1.8b, v2.8b }, [x27], #16
1364 # CHECK-NEXT: [0,3] . D=eE---R. . add x0, x27, #1
1365 # CHECK-NEXT: [0,4] . DeeeeeeER . ld1 { v1.8h, v2.8h }, [x27], #32
1366 # CHECK-NEXT: [0,5] . DeE----R . add x0, x27, #1
1367 # CHECK-NEXT: [0,6] . DeeeeeeER. ld1 { v1.16b, v2.16b }, [x27], #32
1368 # CHECK-NEXT: [0,7] . .DeE----R. add x0, x27, #1
1369 # CHECK-NEXT: [0,8] . .D=eeeeeER ld1 { v1.1d, v2.1d }, [x27], x28
1370 # CHECK-NEXT: [0,9] . . D=eE---R add x0, x27, #1
1372 # CHECK: Average Wait times (based on the timeline view):
1373 # CHECK-NEXT: [0]: Executions
1374 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1375 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1376 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1378 # CHECK: [0] [1] [2] [3]
1379 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s }, [x27], #32
1380 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1381 # CHECK-NEXT: 2. 1 2.0 1.0 0.0 ld1 { v1.8b, v2.8b }, [x27], #16
1382 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1383 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.8h, v2.8h }, [x27], #32
1384 # CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1
1385 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b }, [x27], #32
1386 # CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1
1387 # CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld1 { v1.1d, v2.1d }, [x27], x28
1388 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
1389 # CHECK-NEXT: 1 1.4 0.4 1.8 <total>
1391 # CHECK: [5] Code Region - G06
1393 # CHECK: Iterations: 100
1394 # CHECK-NEXT: Instructions: 1000
1395 # CHECK-NEXT: Total Cycles: 707
1396 # CHECK-NEXT: Total uOps: 1700
1398 # CHECK: Dispatch Width: 3
1399 # CHECK-NEXT: uOps Per Cycle: 2.40
1400 # CHECK-NEXT: IPC: 1.41
1401 # CHECK-NEXT: Block RThroughput: 7.0
1403 # CHECK: Timeline view:
1405 # CHECK-NEXT: Index 0123456789
1407 # CHECK: [0,0] DeeeeeeER . . ld1 { v1.2d, v2.2d }, [x27], x28
1408 # CHECK-NEXT: [0,1] .DeE----R . . add x0, x27, #1
1409 # CHECK-NEXT: [0,2] .D=eeeeeER. . ld1 { v1.2s, v2.2s }, [x27], x28
1410 # CHECK-NEXT: [0,3] . D=eE---R. . add x0, x27, #1
1411 # CHECK-NEXT: [0,4] . D=eeeeeER . ld1 { v1.4h, v2.4h }, [x27], x28
1412 # CHECK-NEXT: [0,5] . D=eE---R . add x0, x27, #1
1413 # CHECK-NEXT: [0,6] . DeeeeeeER. ld1 { v1.4s, v2.4s }, [x27], x28
1414 # CHECK-NEXT: [0,7] . DeE----R. add x0, x27, #1
1415 # CHECK-NEXT: [0,8] . D=eeeeeER ld1 { v1.8b, v2.8b }, [x27], x28
1416 # CHECK-NEXT: [0,9] . .D=eE---R add x0, x27, #1
1418 # CHECK: Average Wait times (based on the timeline view):
1419 # CHECK-NEXT: [0]: Executions
1420 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1421 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1422 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1424 # CHECK: [0] [1] [2] [3]
1425 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d }, [x27], x28
1426 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1427 # CHECK-NEXT: 2. 1 2.0 1.0 0.0 ld1 { v1.2s, v2.2s }, [x27], x28
1428 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1429 # CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld1 { v1.4h, v2.4h }, [x27], x28
1430 # CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1
1431 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.4s, v2.4s }, [x27], x28
1432 # CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1
1433 # CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld1 { v1.8b, v2.8b }, [x27], x28
1434 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
1435 # CHECK-NEXT: 1 1.6 0.3 1.7 <total>
1437 # CHECK: [6] Code Region - G07
1439 # CHECK: Iterations: 100
1440 # CHECK-NEXT: Instructions: 1000
1441 # CHECK-NEXT: Total Cycles: 1107
1442 # CHECK-NEXT: Total uOps: 2100
1444 # CHECK: Dispatch Width: 3
1445 # CHECK-NEXT: uOps Per Cycle: 1.90
1446 # CHECK-NEXT: IPC: 0.90
1447 # CHECK-NEXT: Block RThroughput: 11.0
1449 # CHECK: Timeline view:
1450 # CHECK-NEXT: 01234567
1451 # CHECK-NEXT: Index 0123456789
1453 # CHECK: [0,0] DeeeeeeER . . . ld1 { v1.8h, v2.8h }, [x27], x28
1454 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
1455 # CHECK-NEXT: [0,2] . DeeeeeeER . . ld1 { v1.16b, v2.16b }, [x27], x28
1456 # CHECK-NEXT: [0,3] . DeE----R . . add x0, x27, #1
1457 # CHECK-NEXT: [0,4] . DeeeeeeER . . ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24
1458 # CHECK-NEXT: [0,5] . DeE----R . . add x0, x27, #1
1459 # CHECK-NEXT: [0,6] . .DeeeeeeeER . ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48
1460 # CHECK-NEXT: [0,7] . . DeE-----R . add x0, x27, #1
1461 # CHECK-NEXT: [0,8] . . D=eeeeeeER ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24
1462 # CHECK-NEXT: [0,9] . . D=eE----R add x0, x27, #1
1464 # CHECK: Average Wait times (based on the timeline view):
1465 # CHECK-NEXT: [0]: Executions
1466 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1467 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1468 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1470 # CHECK: [0] [1] [2] [3]
1471 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8h, v2.8h }, [x27], x28
1472 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1473 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b }, [x27], x28
1474 # CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1
1475 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24
1476 # CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1
1477 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48
1478 # CHECK-NEXT: 7. 1 1.0 0.0 5.0 add x0, x27, #1
1479 # CHECK-NEXT: 8. 1 2.0 2.0 0.0 ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24
1480 # CHECK-NEXT: 9. 1 2.0 0.0 4.0 add x0, x27, #1
1481 # CHECK-NEXT: 1 1.2 0.6 2.1 <total>
1483 # CHECK: [7] Code Region - G08
1485 # CHECK: Iterations: 100
1486 # CHECK-NEXT: Instructions: 1000
1487 # CHECK-NEXT: Total Cycles: 1307
1488 # CHECK-NEXT: Total uOps: 2300
1490 # CHECK: Dispatch Width: 3
1491 # CHECK-NEXT: uOps Per Cycle: 1.76
1492 # CHECK-NEXT: IPC: 0.77
1493 # CHECK-NEXT: Block RThroughput: 13.0
1495 # CHECK: Timeline view:
1496 # CHECK-NEXT: 0123456789
1497 # CHECK-NEXT: Index 0123456789
1499 # CHECK: [0,0] DeeeeeeER . . . ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24
1500 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
1501 # CHECK-NEXT: [0,2] . DeeeeeeeER . . ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48
1502 # CHECK-NEXT: [0,3] . DeE-----R . . add x0, x27, #1
1503 # CHECK-NEXT: [0,4] . D=eeeeeeER . . ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24
1504 # CHECK-NEXT: [0,5] . D=eE----R . . add x0, x27, #1
1505 # CHECK-NEXT: [0,6] . .D=eeeeeeeER . ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48
1506 # CHECK-NEXT: [0,7] . . D=eE-----R . add x0, x27, #1
1507 # CHECK-NEXT: [0,8] . . D==eeeeeeeER ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48
1508 # CHECK-NEXT: [0,9] . . D==eE-----R add x0, x27, #1
1510 # CHECK: Average Wait times (based on the timeline view):
1511 # CHECK-NEXT: [0]: Executions
1512 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1513 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1514 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1516 # CHECK: [0] [1] [2] [3]
1517 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24
1518 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1519 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48
1520 # CHECK-NEXT: 3. 1 1.0 0.0 5.0 add x0, x27, #1
1521 # CHECK-NEXT: 4. 1 2.0 2.0 0.0 ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24
1522 # CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1
1523 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48
1524 # CHECK-NEXT: 7. 1 2.0 0.0 5.0 add x0, x27, #1
1525 # CHECK-NEXT: 8. 1 3.0 2.0 0.0 ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48
1526 # CHECK-NEXT: 9. 1 3.0 0.0 5.0 add x0, x27, #1
1527 # CHECK-NEXT: 1 1.8 0.7 2.3 <total>
1529 # CHECK: [8] Code Region - G09
1531 # CHECK: Iterations: 100
1532 # CHECK-NEXT: Instructions: 1000
1533 # CHECK-NEXT: Total Cycles: 1207
1534 # CHECK-NEXT: Total uOps: 2200
1536 # CHECK: Dispatch Width: 3
1537 # CHECK-NEXT: uOps Per Cycle: 1.82
1538 # CHECK-NEXT: IPC: 0.83
1539 # CHECK-NEXT: Block RThroughput: 12.0
1541 # CHECK: Timeline view:
1542 # CHECK-NEXT: 012345678
1543 # CHECK-NEXT: Index 0123456789
1545 # CHECK: [0,0] DeeeeeeER . . . ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28
1546 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
1547 # CHECK-NEXT: [0,2] . DeeeeeeeER . . ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28
1548 # CHECK-NEXT: [0,3] . DeE-----R . . add x0, x27, #1
1549 # CHECK-NEXT: [0,4] . D=eeeeeeER . . ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28
1550 # CHECK-NEXT: [0,5] . D=eE----R . . add x0, x27, #1
1551 # CHECK-NEXT: [0,6] . .D=eeeeeeER . ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28
1552 # CHECK-NEXT: [0,7] . . D=eE----R . add x0, x27, #1
1553 # CHECK-NEXT: [0,8] . . D=eeeeeeeER ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28
1554 # CHECK-NEXT: [0,9] . . D=eE-----R add x0, x27, #1
1556 # CHECK: Average Wait times (based on the timeline view):
1557 # CHECK-NEXT: [0]: Executions
1558 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1559 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1560 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1562 # CHECK: [0] [1] [2] [3]
1563 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28
1564 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1565 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28
1566 # CHECK-NEXT: 3. 1 1.0 0.0 5.0 add x0, x27, #1
1567 # CHECK-NEXT: 4. 1 2.0 2.0 0.0 ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28
1568 # CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1
1569 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28
1570 # CHECK-NEXT: 7. 1 2.0 0.0 4.0 add x0, x27, #1
1571 # CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28
1572 # CHECK-NEXT: 9. 1 2.0 0.0 5.0 add x0, x27, #1
1573 # CHECK-NEXT: 1 1.6 0.6 2.2 <total>
1575 # CHECK: [9] Code Region - G10
1577 # CHECK: Iterations: 100
1578 # CHECK-NEXT: Instructions: 1000
1579 # CHECK-NEXT: Total Cycles: 1407
1580 # CHECK-NEXT: Total uOps: 2400
1582 # CHECK: Dispatch Width: 3
1583 # CHECK-NEXT: uOps Per Cycle: 1.71
1584 # CHECK-NEXT: IPC: 0.71
1585 # CHECK-NEXT: Block RThroughput: 14.0
1587 # CHECK: Timeline view:
1588 # CHECK-NEXT: 0123456789
1589 # CHECK-NEXT: Index 0123456789 0
1591 # CHECK: [0,0] DeeeeeeER . . . ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28
1592 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
1593 # CHECK-NEXT: [0,2] . DeeeeeeeER . . ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28
1594 # CHECK-NEXT: [0,3] . DeE-----R . . add x0, x27, #1
1595 # CHECK-NEXT: [0,4] . D=eeeeeeeER. . ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28
1596 # CHECK-NEXT: [0,5] . D=eE-----R. . add x0, x27, #1
1597 # CHECK-NEXT: [0,6] . .D==eeeeeeER . ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
1598 # CHECK-NEXT: [0,7] . . D==eE----R . add x0, x27, #1
1599 # CHECK-NEXT: [0,8] . . D==eeeeeeeeER ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1600 # CHECK-NEXT: [0,9] . . D==eE------R add x0, x27, #1
1602 # CHECK: Average Wait times (based on the timeline view):
1603 # CHECK-NEXT: [0]: Executions
1604 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1605 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1606 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1608 # CHECK: [0] [1] [2] [3]
1609 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28
1610 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1611 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28
1612 # CHECK-NEXT: 3. 1 1.0 0.0 5.0 add x0, x27, #1
1613 # CHECK-NEXT: 4. 1 2.0 2.0 0.0 ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28
1614 # CHECK-NEXT: 5. 1 2.0 0.0 5.0 add x0, x27, #1
1615 # CHECK-NEXT: 6. 1 3.0 2.0 0.0 ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
1616 # CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1
1617 # CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1618 # CHECK-NEXT: 9. 1 3.0 0.0 6.0 add x0, x27, #1
1619 # CHECK-NEXT: 1 2.0 0.7 2.4 <total>
1621 # CHECK: [10] Code Region - G11
1623 # CHECK: Iterations: 100
1624 # CHECK-NEXT: Instructions: 1000
1625 # CHECK-NEXT: Total Cycles: 1407
1626 # CHECK-NEXT: Total uOps: 2400
1628 # CHECK: Dispatch Width: 3
1629 # CHECK-NEXT: uOps Per Cycle: 1.71
1630 # CHECK-NEXT: IPC: 0.71
1631 # CHECK-NEXT: Block RThroughput: 14.0
1633 # CHECK: Timeline view:
1634 # CHECK-NEXT: 0123456789
1635 # CHECK-NEXT: Index 0123456789 0
1637 # CHECK: [0,0] DeeeeeeER . . . ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1638 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
1639 # CHECK-NEXT: [0,2] . DeeeeeeER . . ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1640 # CHECK-NEXT: [0,3] . DeE----R . . add x0, x27, #1
1641 # CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1642 # CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1
1643 # CHECK-NEXT: [0,6] . .D==eeeeeeER . ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1644 # CHECK-NEXT: [0,7] . . D==eE----R . add x0, x27, #1
1645 # CHECK-NEXT: [0,8] . . D==eeeeeeeeER ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1646 # CHECK-NEXT: [0,9] . . D==eE------R add x0, x27, #1
1648 # CHECK: Average Wait times (based on the timeline view):
1649 # CHECK-NEXT: [0]: Executions
1650 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1651 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1652 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1654 # CHECK: [0] [1] [2] [3]
1655 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1656 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
1657 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1658 # CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1
1659 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1660 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
1661 # CHECK-NEXT: 6. 1 3.0 3.0 0.0 ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1662 # CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1
1663 # CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1664 # CHECK-NEXT: 9. 1 3.0 0.0 6.0 add x0, x27, #1
1665 # CHECK-NEXT: 1 1.8 0.7 2.4 <total>
1667 # CHECK: [11] Code Region - G12
1669 # CHECK: Iterations: 100
1670 # CHECK-NEXT: Instructions: 1000
1671 # CHECK-NEXT: Total Cycles: 1407
1672 # CHECK-NEXT: Total uOps: 2400
1674 # CHECK: Dispatch Width: 3
1675 # CHECK-NEXT: uOps Per Cycle: 1.71
1676 # CHECK-NEXT: IPC: 0.71
1677 # CHECK-NEXT: Block RThroughput: 14.0
1679 # CHECK: Timeline view:
1680 # CHECK-NEXT: 0123456789
1681 # CHECK-NEXT: Index 0123456789 0
1683 # CHECK: [0,0] DeeeeeeeeER . . ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1684 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
1685 # CHECK-NEXT: [0,2] . D==eeeeeeER . . ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
1686 # CHECK-NEXT: [0,3] . D==eE----R . . add x0, x27, #1
1687 # CHECK-NEXT: [0,4] . D==eeeeeeeeER . ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1688 # CHECK-NEXT: [0,5] . D==eE------R . add x0, x27, #1
1689 # CHECK-NEXT: [0,6] . .D====eeeeeeER . ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1690 # CHECK-NEXT: [0,7] . . D====eE----R . add x0, x27, #1
1691 # CHECK-NEXT: [0,8] . . D====eeeeeeER ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1692 # CHECK-NEXT: [0,9] . . D====eE----R add x0, x27, #1
1694 # CHECK: Average Wait times (based on the timeline view):
1695 # CHECK-NEXT: [0]: Executions
1696 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1697 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1698 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1700 # CHECK: [0] [1] [2] [3]
1701 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1702 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
1703 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
1704 # CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1
1705 # CHECK-NEXT: 4. 1 3.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1706 # CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1
1707 # CHECK-NEXT: 6. 1 5.0 3.0 0.0 ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1708 # CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1
1709 # CHECK-NEXT: 8. 1 5.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1710 # CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1
1711 # CHECK-NEXT: 1 3.4 0.9 2.4 <total>
1713 # CHECK: [12] Code Region - G13
1715 # CHECK: Iterations: 100
1716 # CHECK-NEXT: Instructions: 1000
1717 # CHECK-NEXT: Total Cycles: 1910
1718 # CHECK-NEXT: Total uOps: 2600
1720 # CHECK: Dispatch Width: 3
1721 # CHECK-NEXT: uOps Per Cycle: 1.36
1722 # CHECK-NEXT: IPC: 0.52
1723 # CHECK-NEXT: Block RThroughput: 15.0
1725 # CHECK: Timeline view:
1726 # CHECK-NEXT: 0123456789
1727 # CHECK-NEXT: Index 0123456789 012345678
1729 # CHECK: [0,0] DeeeeeeeeER . . . . ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1730 # CHECK-NEXT: [0,1] .DeE------R . . . . add x0, x27, #1
1731 # CHECK-NEXT: [0,2] . D==eeeeeeER . . . . ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1732 # CHECK-NEXT: [0,3] . D==eE----R . . . . add x0, x27, #1
1733 # CHECK-NEXT: [0,4] . D==eeeeeeeeER . . . ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1734 # CHECK-NEXT: [0,5] . D==eE------R . . . add x0, x27, #1
1735 # CHECK-NEXT: [0,6] . .D====eeeeeeeeER . . ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1736 # CHECK-NEXT: [0,7] . . D====eE------R . . add x0, x27, #1
1737 # CHECK-NEXT: [0,8] . . D==========eeeeeeeeER ld1 { v1.b }[0], [x27], #1
1738 # CHECK-NEXT: [0,9] . . D==========eE------R add x0, x27, #1
1740 # CHECK: Average Wait times (based on the timeline view):
1741 # CHECK-NEXT: [0]: Executions
1742 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1743 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1744 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1746 # CHECK: [0] [1] [2] [3]
1747 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1748 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
1749 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1750 # CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1
1751 # CHECK-NEXT: 4. 1 3.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1752 # CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1
1753 # CHECK-NEXT: 6. 1 5.0 3.0 0.0 ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1754 # CHECK-NEXT: 7. 1 5.0 0.0 6.0 add x0, x27, #1
1755 # CHECK-NEXT: 8. 1 11.0 0.0 0.0 ld1 { v1.b }[0], [x27], #1
1756 # CHECK-NEXT: 9. 1 11.0 0.0 6.0 add x0, x27, #1
1757 # CHECK-NEXT: 1 4.6 0.8 2.8 <total>
1759 # CHECK: [13] Code Region - G14
1761 # CHECK: Iterations: 100
1762 # CHECK-NEXT: Instructions: 1000
1763 # CHECK-NEXT: Total Cycles: 4003
1764 # CHECK-NEXT: Total uOps: 2000
1766 # CHECK: Dispatch Width: 3
1767 # CHECK-NEXT: uOps Per Cycle: 0.50
1768 # CHECK-NEXT: IPC: 0.25
1769 # CHECK-NEXT: Block RThroughput: 6.7
1771 # CHECK: Timeline view:
1772 # CHECK-NEXT: 0123456789 0123456789
1773 # CHECK-NEXT: Index 0123456789 0123456789 012
1775 # CHECK: [0,0] DeeeeeeeeER . . . . . . . ld1 { v1.b }[8], [x27], #1
1776 # CHECK-NEXT: [0,1] .DeE------R . . . . . . . add x0, x27, #1
1777 # CHECK-NEXT: [0,2] . D======eeeeeeeeER . . . . . . ld1 { v1.b }[0], [x27], x28
1778 # CHECK-NEXT: [0,3] . D======eE------R . . . . . . add x0, x27, #1
1779 # CHECK-NEXT: [0,4] . D============eeeeeeeeER . . . . ld1 { v1.b }[8], [x27], x28
1780 # CHECK-NEXT: [0,5] . D============eE------R . . . . add x0, x27, #1
1781 # CHECK-NEXT: [0,6] . .D==================eeeeeeeeER. . . ld1 { v1.h }[0], [x27], #2
1782 # CHECK-NEXT: [0,7] . . D==================eE------R. . . add x0, x27, #1
1783 # CHECK-NEXT: [0,8] . . D========================eeeeeeeeER ld1 { v1.h }[4], [x27], #2
1784 # CHECK-NEXT: [0,9] . . D========================eE------R add x0, x27, #1
1786 # CHECK: Average Wait times (based on the timeline view):
1787 # CHECK-NEXT: [0]: Executions
1788 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1789 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1790 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1792 # CHECK: [0] [1] [2] [3]
1793 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.b }[8], [x27], #1
1794 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
1795 # CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld1 { v1.b }[0], [x27], x28
1796 # CHECK-NEXT: 3. 1 7.0 0.0 6.0 add x0, x27, #1
1797 # CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld1 { v1.b }[8], [x27], x28
1798 # CHECK-NEXT: 5. 1 13.0 0.0 6.0 add x0, x27, #1
1799 # CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld1 { v1.h }[0], [x27], #2
1800 # CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1
1801 # CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld1 { v1.h }[4], [x27], #2
1802 # CHECK-NEXT: 9. 1 25.0 0.0 6.0 add x0, x27, #1
1803 # CHECK-NEXT: 1 13.0 0.1 3.0 <total>
1805 # CHECK: [14] Code Region - G15
1807 # CHECK: Iterations: 100
1808 # CHECK-NEXT: Instructions: 1000
1809 # CHECK-NEXT: Total Cycles: 3703
1810 # CHECK-NEXT: Total uOps: 1900
1812 # CHECK: Dispatch Width: 3
1813 # CHECK-NEXT: uOps Per Cycle: 0.51
1814 # CHECK-NEXT: IPC: 0.27
1815 # CHECK-NEXT: Block RThroughput: 6.3
1817 # CHECK: Timeline view:
1818 # CHECK-NEXT: 0123456789 0123456789
1819 # CHECK-NEXT: Index 0123456789 0123456789
1821 # CHECK: [0,0] DeeeeeeeeER . . . . . . ld1 { v1.h }[0], [x27], x28
1822 # CHECK-NEXT: [0,1] .DeE------R . . . . . . add x0, x27, #1
1823 # CHECK-NEXT: [0,2] . D======eeeeeeeeER . . . . . ld1 { v1.h }[4], [x27], x28
1824 # CHECK-NEXT: [0,3] . D======eE------R . . . . . add x0, x27, #1
1825 # CHECK-NEXT: [0,4] . D============eeeeeeeeER . . . ld1 { v1.s }[0], [x27], #4
1826 # CHECK-NEXT: [0,5] . D============eE------R . . . add x0, x27, #1
1827 # CHECK-NEXT: [0,6] . .D==================eeeeeeeeER. . ld1 { v1.s }[0], [x27], x28
1828 # CHECK-NEXT: [0,7] . . D==================eE------R. . add x0, x27, #1
1829 # CHECK-NEXT: [0,8] . . D=========================eeeeeER ld1 { v1.d }[0], [x27], #8
1830 # CHECK-NEXT: [0,9] . . D=========================eE---R add x0, x27, #1
1832 # CHECK: Average Wait times (based on the timeline view):
1833 # CHECK-NEXT: [0]: Executions
1834 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1835 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1836 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1838 # CHECK: [0] [1] [2] [3]
1839 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.h }[0], [x27], x28
1840 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
1841 # CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld1 { v1.h }[4], [x27], x28
1842 # CHECK-NEXT: 3. 1 7.0 0.0 6.0 add x0, x27, #1
1843 # CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld1 { v1.s }[0], [x27], #4
1844 # CHECK-NEXT: 5. 1 13.0 0.0 6.0 add x0, x27, #1
1845 # CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld1 { v1.s }[0], [x27], x28
1846 # CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1
1847 # CHECK-NEXT: 8. 1 26.0 0.0 0.0 ld1 { v1.d }[0], [x27], #8
1848 # CHECK-NEXT: 9. 1 26.0 0.0 3.0 add x0, x27, #1
1849 # CHECK-NEXT: 1 13.2 0.1 2.7 <total>
1851 # CHECK: [15] Code Region - G16
1853 # CHECK: Iterations: 100
1854 # CHECK-NEXT: Instructions: 1000
1855 # CHECK-NEXT: Total Cycles: 1205
1856 # CHECK-NEXT: Total uOps: 1800
1858 # CHECK: Dispatch Width: 3
1859 # CHECK-NEXT: uOps Per Cycle: 1.49
1860 # CHECK-NEXT: IPC: 0.83
1861 # CHECK-NEXT: Block RThroughput: 6.0
1863 # CHECK: Timeline view:
1864 # CHECK-NEXT: 0123456
1865 # CHECK-NEXT: Index 0123456789
1867 # CHECK: [0,0] DeeeeeER . .. ld1 { v1.d }[0], [x27], x28
1868 # CHECK-NEXT: [0,1] D=eE---R . .. add x0, x27, #1
1869 # CHECK-NEXT: [0,2] .DeeeeeER . .. ld1r { v1.1d }, [x27], #8
1870 # CHECK-NEXT: [0,3] .D=eE---R . .. add x0, x27, #1
1871 # CHECK-NEXT: [0,4] . DeeeeeeeeER .. ld1r { v1.2d }, [x27], #8
1872 # CHECK-NEXT: [0,5] . DeE------R .. add x0, x27, #1
1873 # CHECK-NEXT: [0,6] . DeeeeeeeeER.. ld1r { v1.2s }, [x27], #4
1874 # CHECK-NEXT: [0,7] . DeE------R.. add x0, x27, #1
1875 # CHECK-NEXT: [0,8] . .DeeeeeeeeER ld1r { v1.4h }, [x27], #2
1876 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
1878 # CHECK: Average Wait times (based on the timeline view):
1879 # CHECK-NEXT: [0]: Executions
1880 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1881 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1882 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1884 # CHECK: [0] [1] [2] [3]
1885 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.d }[0], [x27], x28
1886 # CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1
1887 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1r { v1.1d }, [x27], #8
1888 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
1889 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1r { v1.2d }, [x27], #8
1890 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
1891 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1r { v1.2s }, [x27], #4
1892 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
1893 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld1r { v1.4h }, [x27], #2
1894 # CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1
1895 # CHECK-NEXT: 1 1.2 0.3 2.4 <total>
1897 # CHECK: [16] Code Region - G17
1899 # CHECK: Iterations: 100
1900 # CHECK-NEXT: Instructions: 1000
1901 # CHECK-NEXT: Total Cycles: 908
1902 # CHECK-NEXT: Total uOps: 1900
1904 # CHECK: Dispatch Width: 3
1905 # CHECK-NEXT: uOps Per Cycle: 2.09
1906 # CHECK-NEXT: IPC: 1.10
1907 # CHECK-NEXT: Block RThroughput: 6.3
1909 # CHECK: Timeline view:
1910 # CHECK-NEXT: 0123456
1911 # CHECK-NEXT: Index 0123456789
1913 # CHECK: [0,0] DeeeeeeeeER .. ld1r { v1.4s }, [x27], #4
1914 # CHECK-NEXT: [0,1] .DeE------R .. add x0, x27, #1
1915 # CHECK-NEXT: [0,2] . DeeeeeeeeER .. ld1r { v1.8b }, [x27], #1
1916 # CHECK-NEXT: [0,3] . DeE------R .. add x0, x27, #1
1917 # CHECK-NEXT: [0,4] . DeeeeeeeeER.. ld1r { v1.8h }, [x27], #2
1918 # CHECK-NEXT: [0,5] . DeE------R.. add x0, x27, #1
1919 # CHECK-NEXT: [0,6] . .DeeeeeeeeER ld1r { v1.16b }, [x27], #1
1920 # CHECK-NEXT: [0,7] . . DeE------R add x0, x27, #1
1921 # CHECK-NEXT: [0,8] . . DeeeeeE--R ld1r { v1.1d }, [x27], x28
1922 # CHECK-NEXT: [0,9] . . DeE-----R add x0, x27, #1
1924 # CHECK: Average Wait times (based on the timeline view):
1925 # CHECK-NEXT: [0]: Executions
1926 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1927 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1928 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1930 # CHECK: [0] [1] [2] [3]
1931 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.4s }, [x27], #4
1932 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
1933 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1r { v1.8b }, [x27], #1
1934 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
1935 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1r { v1.8h }, [x27], #2
1936 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
1937 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1r { v1.16b }, [x27], #1
1938 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
1939 # CHECK-NEXT: 8. 1 1.0 0.0 2.0 ld1r { v1.1d }, [x27], x28
1940 # CHECK-NEXT: 9. 1 1.0 0.0 5.0 add x0, x27, #1
1941 # CHECK-NEXT: 1 1.0 0.4 3.1 <total>
1943 # CHECK: [17] Code Region - G18
1945 # CHECK: Iterations: 100
1946 # CHECK-NEXT: Instructions: 1000
1947 # CHECK-NEXT: Total Cycles: 1009
1948 # CHECK-NEXT: Total uOps: 2000
1950 # CHECK: Dispatch Width: 3
1951 # CHECK-NEXT: uOps Per Cycle: 1.98
1952 # CHECK-NEXT: IPC: 0.99
1953 # CHECK-NEXT: Block RThroughput: 6.7
1955 # CHECK: Timeline view:
1956 # CHECK-NEXT: 012345678
1957 # CHECK-NEXT: Index 0123456789
1959 # CHECK: [0,0] DeeeeeeeeER . . ld1r { v1.2d }, [x27], x28
1960 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
1961 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld1r { v1.2s }, [x27], x28
1962 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
1963 # CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld1r { v1.4h }, [x27], x28
1964 # CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1
1965 # CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld1r { v1.4s }, [x27], x28
1966 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
1967 # CHECK-NEXT: [0,8] . . DeeeeeeeeER ld1r { v1.8b }, [x27], x28
1968 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
1970 # CHECK: Average Wait times (based on the timeline view):
1971 # CHECK-NEXT: [0]: Executions
1972 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1973 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1974 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1976 # CHECK: [0] [1] [2] [3]
1977 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.2d }, [x27], x28
1978 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
1979 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1r { v1.2s }, [x27], x28
1980 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
1981 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1r { v1.4h }, [x27], x28
1982 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
1983 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1r { v1.4s }, [x27], x28
1984 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
1985 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld1r { v1.8b }, [x27], x28
1986 # CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1
1987 # CHECK-NEXT: 1 1.0 0.5 3.0 <total>
1989 # CHECK: [18] Code Region - G19
1991 # CHECK: Iterations: 100
1992 # CHECK-NEXT: Instructions: 1000
1993 # CHECK-NEXT: Total Cycles: 1009
1994 # CHECK-NEXT: Total uOps: 2000
1996 # CHECK: Dispatch Width: 3
1997 # CHECK-NEXT: uOps Per Cycle: 1.98
1998 # CHECK-NEXT: IPC: 0.99
1999 # CHECK-NEXT: Block RThroughput: 6.7
2001 # CHECK: Timeline view:
2002 # CHECK-NEXT: 012345678
2003 # CHECK-NEXT: Index 0123456789
2005 # CHECK: [0,0] DeeeeeeeeER . . ld1r { v1.8h }, [x27], x28
2006 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2007 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld1r { v1.16b }, [x27], x28
2008 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2009 # CHECK-NEXT: [0,4] . DeeeeeeER . . ld2 { v1.2d, v2.2d }, [x27], #32
2010 # CHECK-NEXT: [0,5] . DeE----R . . add x0, x27, #1
2011 # CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2 { v1.2s, v2.2s }, [x27], #16
2012 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
2013 # CHECK-NEXT: [0,8] . . DeeeeeeeeER ld2 { v1.4h, v2.4h }, [x27], #16
2014 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
2016 # CHECK: Average Wait times (based on the timeline view):
2017 # CHECK-NEXT: [0]: Executions
2018 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2019 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2020 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2022 # CHECK: [0] [1] [2] [3]
2023 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.8h }, [x27], x28
2024 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2025 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1r { v1.16b }, [x27], x28
2026 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2027 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2 { v1.2d, v2.2d }, [x27], #32
2028 # CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1
2029 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2 { v1.2s, v2.2s }, [x27], #16
2030 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2031 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2 { v1.4h, v2.4h }, [x27], #16
2032 # CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1
2033 # CHECK-NEXT: 1 1.0 0.5 2.8 <total>
2035 # CHECK: [19] Code Region - G20
2037 # CHECK: Iterations: 100
2038 # CHECK-NEXT: Instructions: 1000
2039 # CHECK-NEXT: Total Cycles: 1008
2040 # CHECK-NEXT: Total uOps: 2600
2042 # CHECK: Dispatch Width: 3
2043 # CHECK-NEXT: uOps Per Cycle: 2.58
2044 # CHECK-NEXT: IPC: 0.99
2045 # CHECK-NEXT: Block RThroughput: 9.0
2047 # CHECK: Timeline view:
2048 # CHECK-NEXT: 01234567
2049 # CHECK-NEXT: Index 0123456789
2051 # CHECK: [0,0] DeeeeeeeeeER . . ld2 { v1.4s, v2.4s }, [x27], #32
2052 # CHECK-NEXT: [0,1] .DeE-------R . . add x0, x27, #1
2053 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2 { v1.8b, v2.8b }, [x27], #16
2054 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2055 # CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld2 { v1.8h, v2.8h }, [x27], #32
2056 # CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1
2057 # CHECK-NEXT: [0,6] . .DeeeeeeeeeER ld2 { v1.16b, v2.16b }, [x27], #32
2058 # CHECK-NEXT: [0,7] . . DeE-------R add x0, x27, #1
2059 # CHECK-NEXT: [0,8] . . DeeeeeeE-R ld2 { v1.2d, v2.2d }, [x27], x28
2060 # CHECK-NEXT: [0,9] . . DeE-----R add x0, x27, #1
2062 # CHECK: Average Wait times (based on the timeline view):
2063 # CHECK-NEXT: [0]: Executions
2064 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2065 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2066 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2068 # CHECK: [0] [1] [2] [3]
2069 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.4s, v2.4s }, [x27], #32
2070 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2071 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2 { v1.8b, v2.8b }, [x27], #16
2072 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2073 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2 { v1.8h, v2.8h }, [x27], #32
2074 # CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1
2075 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2 { v1.16b, v2.16b }, [x27], #32
2076 # CHECK-NEXT: 7. 1 1.0 0.0 7.0 add x0, x27, #1
2077 # CHECK-NEXT: 8. 1 1.0 1.0 1.0 ld2 { v1.2d, v2.2d }, [x27], x28
2078 # CHECK-NEXT: 9. 1 1.0 0.0 5.0 add x0, x27, #1
2079 # CHECK-NEXT: 1 1.0 0.5 3.3 <total>
2081 # CHECK: [20] Code Region - G21
2083 # CHECK: Iterations: 100
2084 # CHECK-NEXT: Instructions: 1000
2085 # CHECK-NEXT: Total Cycles: 1010
2086 # CHECK-NEXT: Total uOps: 2400
2088 # CHECK: Dispatch Width: 3
2089 # CHECK-NEXT: uOps Per Cycle: 2.38
2090 # CHECK-NEXT: IPC: 0.99
2091 # CHECK-NEXT: Block RThroughput: 8.0
2093 # CHECK: Timeline view:
2094 # CHECK-NEXT: 0123456789
2095 # CHECK-NEXT: Index 0123456789
2097 # CHECK: [0,0] DeeeeeeeeER . . ld2 { v1.2s, v2.2s }, [x27], x28
2098 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2099 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2 { v1.4h, v2.4h }, [x27], x28
2100 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2101 # CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld2 { v1.4s, v2.4s }, [x27], x28
2102 # CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1
2103 # CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2 { v1.8b, v2.8b }, [x27], x28
2104 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
2105 # CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld2 { v1.8h, v2.8h }, [x27], x28
2106 # CHECK-NEXT: [0,9] . . DeE-------R add x0, x27, #1
2108 # CHECK: Average Wait times (based on the timeline view):
2109 # CHECK-NEXT: [0]: Executions
2110 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2111 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2112 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2114 # CHECK: [0] [1] [2] [3]
2115 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.2s, v2.2s }, [x27], x28
2116 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2117 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2 { v1.4h, v2.4h }, [x27], x28
2118 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2119 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2 { v1.4s, v2.4s }, [x27], x28
2120 # CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1
2121 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2 { v1.8b, v2.8b }, [x27], x28
2122 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2123 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2 { v1.8h, v2.8h }, [x27], x28
2124 # CHECK-NEXT: 9. 1 1.0 0.0 7.0 add x0, x27, #1
2125 # CHECK-NEXT: 1 1.0 0.5 3.2 <total>
2127 # CHECK: [21] Code Region - G22
2129 # CHECK: Iterations: 100
2130 # CHECK-NEXT: Instructions: 1000
2131 # CHECK-NEXT: Total Cycles: 3410
2132 # CHECK-NEXT: Total uOps: 2600
2134 # CHECK: Dispatch Width: 3
2135 # CHECK-NEXT: uOps Per Cycle: 0.76
2136 # CHECK-NEXT: IPC: 0.29
2137 # CHECK-NEXT: Block RThroughput: 8.7
2139 # CHECK: Timeline view:
2140 # CHECK-NEXT: 0123456789 0123456789
2141 # CHECK-NEXT: Index 0123456789 0123456789 0123
2143 # CHECK: [0,0] DeeeeeeeeeER . . . . . . . ld2 { v1.16b, v2.16b }, [x27], x28
2144 # CHECK-NEXT: [0,1] .DeE-------R . . . . . . . add x0, x27, #1
2145 # CHECK-NEXT: [0,2] . D=======eeeeeeeeER. . . . . . ld2 { v1.b, v2.b }[0], [x27], #2
2146 # CHECK-NEXT: [0,3] . D=======eE------R. . . . . . add x0, x27, #1
2147 # CHECK-NEXT: [0,4] . D=============eeeeeeeeER . . . . ld2 { v1.b, v2.b }[8], [x27], #2
2148 # CHECK-NEXT: [0,5] . D=============eE------R . . . . add x0, x27, #1
2149 # CHECK-NEXT: [0,6] . .D===================eeeeeeeeER . . ld2 { v1.b, v2.b }[0], [x27], x28
2150 # CHECK-NEXT: [0,7] . . D===================eE------R . . add x0, x27, #1
2151 # CHECK-NEXT: [0,8] . . D=========================eeeeeeeeER ld2 { v1.b, v2.b }[8], [x27], x28
2152 # CHECK-NEXT: [0,9] . . D=========================eE------R add x0, x27, #1
2154 # CHECK: Average Wait times (based on the timeline view):
2155 # CHECK-NEXT: [0]: Executions
2156 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2157 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2158 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2160 # CHECK: [0] [1] [2] [3]
2161 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.16b, v2.16b }, [x27], x28
2162 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2163 # CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld2 { v1.b, v2.b }[0], [x27], #2
2164 # CHECK-NEXT: 3. 1 8.0 0.0 6.0 add x0, x27, #1
2165 # CHECK-NEXT: 4. 1 14.0 0.0 0.0 ld2 { v1.b, v2.b }[8], [x27], #2
2166 # CHECK-NEXT: 5. 1 14.0 0.0 6.0 add x0, x27, #1
2167 # CHECK-NEXT: 6. 1 20.0 0.0 0.0 ld2 { v1.b, v2.b }[0], [x27], x28
2168 # CHECK-NEXT: 7. 1 20.0 0.0 6.0 add x0, x27, #1
2169 # CHECK-NEXT: 8. 1 26.0 0.0 0.0 ld2 { v1.b, v2.b }[8], [x27], x28
2170 # CHECK-NEXT: 9. 1 26.0 0.0 6.0 add x0, x27, #1
2171 # CHECK-NEXT: 1 13.8 0.1 3.1 <total>
2173 # CHECK: [22] Code Region - G23
2175 # CHECK: Iterations: 100
2176 # CHECK-NEXT: Instructions: 1000
2177 # CHECK-NEXT: Total Cycles: 3803
2178 # CHECK-NEXT: Total uOps: 2400
2180 # CHECK: Dispatch Width: 3
2181 # CHECK-NEXT: uOps Per Cycle: 0.63
2182 # CHECK-NEXT: IPC: 0.26
2183 # CHECK-NEXT: Block RThroughput: 8.0
2185 # CHECK: Timeline view:
2186 # CHECK-NEXT: 0123456789 0123456789
2187 # CHECK-NEXT: Index 0123456789 0123456789 0
2189 # CHECK: [0,0] DeeeeeeeeER . . . . . . ld2 { v1.h, v2.h }[0], [x27], #4
2190 # CHECK-NEXT: [0,1] .DeE------R . . . . . . add x0, x27, #1
2191 # CHECK-NEXT: [0,2] . D======eeeeeeeeER . . . . . ld2 { v1.h, v2.h }[4], [x27], #4
2192 # CHECK-NEXT: [0,3] . D======eE------R . . . . . add x0, x27, #1
2193 # CHECK-NEXT: [0,4] . D============eeeeeeeeER . . . ld2 { v1.h, v2.h }[0], [x27], x28
2194 # CHECK-NEXT: [0,5] . D============eE------R . . . add x0, x27, #1
2195 # CHECK-NEXT: [0,6] . .D==================eeeeeeeeER. . ld2 { v1.h, v2.h }[4], [x27], x28
2196 # CHECK-NEXT: [0,7] . . D==================eE------R. . add x0, x27, #1
2197 # CHECK-NEXT: [0,8] . . D========================eeeeeeER ld2 { v1.s, v2.s }[0], [x27], #8
2198 # CHECK-NEXT: [0,9] . . D========================eE----R add x0, x27, #1
2200 # CHECK: Average Wait times (based on the timeline view):
2201 # CHECK-NEXT: [0]: Executions
2202 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2203 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2204 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2206 # CHECK: [0] [1] [2] [3]
2207 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.h, v2.h }[0], [x27], #4
2208 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2209 # CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld2 { v1.h, v2.h }[4], [x27], #4
2210 # CHECK-NEXT: 3. 1 7.0 0.0 6.0 add x0, x27, #1
2211 # CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld2 { v1.h, v2.h }[0], [x27], x28
2212 # CHECK-NEXT: 5. 1 13.0 0.0 6.0 add x0, x27, #1
2213 # CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld2 { v1.h, v2.h }[4], [x27], x28
2214 # CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1
2215 # CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld2 { v1.s, v2.s }[0], [x27], #8
2216 # CHECK-NEXT: 9. 1 25.0 0.0 4.0 add x0, x27, #1
2217 # CHECK-NEXT: 1 13.0 0.1 2.8 <total>
2219 # CHECK: [23] Code Region - G24
2221 # CHECK: Iterations: 100
2222 # CHECK-NEXT: Instructions: 1000
2223 # CHECK-NEXT: Total Cycles: 2403
2224 # CHECK-NEXT: Total uOps: 2000
2226 # CHECK: Dispatch Width: 3
2227 # CHECK-NEXT: uOps Per Cycle: 0.83
2228 # CHECK-NEXT: IPC: 0.42
2229 # CHECK-NEXT: Block RThroughput: 6.7
2231 # CHECK: Timeline view:
2232 # CHECK-NEXT: 0123456789
2233 # CHECK-NEXT: Index 0123456789 0123456
2235 # CHECK: [0,0] DeeeeeeER . . . .. ld2 { v1.s, v2.s }[0], [x27], x28
2236 # CHECK-NEXT: [0,1] .DeE----R . . . .. add x0, x27, #1
2237 # CHECK-NEXT: [0,2] . D====eeeeeeeeER . .. ld2 { v1.d, v2.d }[0], [x27], #16
2238 # CHECK-NEXT: [0,3] . D====eE------R . .. add x0, x27, #1
2239 # CHECK-NEXT: [0,4] . D==========eeeeeeeeER.. ld2 { v1.d, v2.d }[0], [x27], x28
2240 # CHECK-NEXT: [0,5] . D==========eE------R.. add x0, x27, #1
2241 # CHECK-NEXT: [0,6] . D==========eeeeeE--R.. ld2r { v1.1d, v2.1d }, [x27], #16
2242 # CHECK-NEXT: [0,7] . .D==========eE-----R.. add x0, x27, #1
2243 # CHECK-NEXT: [0,8] . . D=========eeeeeeeeER ld2r { v1.2d, v2.2d }, [x27], #16
2244 # CHECK-NEXT: [0,9] . . D=========eE------R add x0, x27, #1
2246 # CHECK: Average Wait times (based on the timeline view):
2247 # CHECK-NEXT: [0]: Executions
2248 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2249 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2250 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2252 # CHECK: [0] [1] [2] [3]
2253 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.s, v2.s }[0], [x27], x28
2254 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
2255 # CHECK-NEXT: 2. 1 5.0 0.0 0.0 ld2 { v1.d, v2.d }[0], [x27], #16
2256 # CHECK-NEXT: 3. 1 5.0 0.0 6.0 add x0, x27, #1
2257 # CHECK-NEXT: 4. 1 11.0 0.0 0.0 ld2 { v1.d, v2.d }[0], [x27], x28
2258 # CHECK-NEXT: 5. 1 11.0 0.0 6.0 add x0, x27, #1
2259 # CHECK-NEXT: 6. 1 11.0 0.0 2.0 ld2r { v1.1d, v2.1d }, [x27], #16
2260 # CHECK-NEXT: 7. 1 11.0 0.0 5.0 add x0, x27, #1
2261 # CHECK-NEXT: 8. 1 10.0 0.0 0.0 ld2r { v1.2d, v2.2d }, [x27], #16
2262 # CHECK-NEXT: 9. 1 10.0 0.0 6.0 add x0, x27, #1
2263 # CHECK-NEXT: 1 7.6 0.1 2.9 <total>
2265 # CHECK: [24] Code Region - G25
2267 # CHECK: Iterations: 100
2268 # CHECK-NEXT: Instructions: 1000
2269 # CHECK-NEXT: Total Cycles: 1009
2270 # CHECK-NEXT: Total uOps: 2200
2272 # CHECK: Dispatch Width: 3
2273 # CHECK-NEXT: uOps Per Cycle: 2.18
2274 # CHECK-NEXT: IPC: 0.99
2275 # CHECK-NEXT: Block RThroughput: 7.3
2277 # CHECK: Timeline view:
2278 # CHECK-NEXT: 012345678
2279 # CHECK-NEXT: Index 0123456789
2281 # CHECK: [0,0] DeeeeeeeeER . . ld2r { v1.2s, v2.2s }, [x27], #8
2282 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2283 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2r { v1.4h, v2.4h }, [x27], #4
2284 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2285 # CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld2r { v1.4s, v2.4s }, [x27], #8
2286 # CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1
2287 # CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2r { v1.8b, v2.8b }, [x27], #2
2288 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
2289 # CHECK-NEXT: [0,8] . . DeeeeeeeeER ld2r { v1.8h, v2.8h }, [x27], #4
2290 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
2292 # CHECK: Average Wait times (based on the timeline view):
2293 # CHECK-NEXT: [0]: Executions
2294 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2295 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2296 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2298 # CHECK: [0] [1] [2] [3]
2299 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.2s, v2.2s }, [x27], #8
2300 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2301 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2r { v1.4h, v2.4h }, [x27], #4
2302 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2303 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2r { v1.4s, v2.4s }, [x27], #8
2304 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
2305 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2r { v1.8b, v2.8b }, [x27], #2
2306 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2307 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2r { v1.8h, v2.8h }, [x27], #4
2308 # CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1
2309 # CHECK-NEXT: 1 1.0 0.5 3.0 <total>
2311 # CHECK: [25] Code Region - G26
2313 # CHECK: Iterations: 100
2314 # CHECK-NEXT: Instructions: 1000
2315 # CHECK-NEXT: Total Cycles: 909
2316 # CHECK-NEXT: Total uOps: 2100
2318 # CHECK: Dispatch Width: 3
2319 # CHECK-NEXT: uOps Per Cycle: 2.31
2320 # CHECK-NEXT: IPC: 1.10
2321 # CHECK-NEXT: Block RThroughput: 7.0
2323 # CHECK: Timeline view:
2324 # CHECK-NEXT: 01234567
2325 # CHECK-NEXT: Index 0123456789
2327 # CHECK: [0,0] DeeeeeeeeER . . ld2r { v1.16b, v2.16b }, [x27], #2
2328 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2329 # CHECK-NEXT: [0,2] . DeeeeeE-R . . ld2r { v1.1d, v2.1d }, [x27], x28
2330 # CHECK-NEXT: [0,3] . D=eE----R . . add x0, x27, #1
2331 # CHECK-NEXT: [0,4] . DeeeeeeeeER . . ld2r { v1.2d, v2.2d }, [x27], x28
2332 # CHECK-NEXT: [0,5] . DeE------R . . add x0, x27, #1
2333 # CHECK-NEXT: [0,6] . DeeeeeeeeER . ld2r { v1.2s, v2.2s }, [x27], x28
2334 # CHECK-NEXT: [0,7] . .DeE------R . add x0, x27, #1
2335 # CHECK-NEXT: [0,8] . . DeeeeeeeeER ld2r { v1.4h, v2.4h }, [x27], x28
2336 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
2338 # CHECK: Average Wait times (based on the timeline view):
2339 # CHECK-NEXT: [0]: Executions
2340 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2341 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2342 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2344 # CHECK: [0] [1] [2] [3]
2345 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.16b, v2.16b }, [x27], #2
2346 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2347 # CHECK-NEXT: 2. 1 1.0 1.0 1.0 ld2r { v1.1d, v2.1d }, [x27], x28
2348 # CHECK-NEXT: 3. 1 2.0 0.0 4.0 add x0, x27, #1
2349 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld2r { v1.2d, v2.2d }, [x27], x28
2350 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
2351 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2r { v1.2s, v2.2s }, [x27], x28
2352 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2353 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2r { v1.4h, v2.4h }, [x27], x28
2354 # CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1
2355 # CHECK-NEXT: 1 1.1 0.4 2.9 <total>
2357 # CHECK: [26] Code Region - G27
2359 # CHECK: Iterations: 100
2360 # CHECK-NEXT: Instructions: 1000
2361 # CHECK-NEXT: Total Cycles: 1009
2362 # CHECK-NEXT: Total uOps: 2500
2364 # CHECK: Dispatch Width: 3
2365 # CHECK-NEXT: uOps Per Cycle: 2.48
2366 # CHECK-NEXT: IPC: 0.99
2367 # CHECK-NEXT: Block RThroughput: 8.3
2369 # CHECK: Timeline view:
2370 # CHECK-NEXT: 012345678
2371 # CHECK-NEXT: Index 0123456789
2373 # CHECK: [0,0] DeeeeeeeeER . . ld2r { v1.4s, v2.4s }, [x27], x28
2374 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2375 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2r { v1.8b, v2.8b }, [x27], x28
2376 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2377 # CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld2r { v1.8h, v2.8h }, [x27], x28
2378 # CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1
2379 # CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2r { v1.16b, v2.16b }, [x27], x28
2380 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
2381 # CHECK-NEXT: [0,8] . . DeeeeeeeeER ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48
2382 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
2384 # CHECK: Average Wait times (based on the timeline view):
2385 # CHECK-NEXT: [0]: Executions
2386 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2387 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2388 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2390 # CHECK: [0] [1] [2] [3]
2391 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.4s, v2.4s }, [x27], x28
2392 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2393 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2r { v1.8b, v2.8b }, [x27], x28
2394 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2395 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2r { v1.8h, v2.8h }, [x27], x28
2396 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
2397 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2r { v1.16b, v2.16b }, [x27], x28
2398 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2399 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48
2400 # CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1
2401 # CHECK-NEXT: 1 1.0 0.5 3.0 <total>
2403 # CHECK: [27] Code Region - G28
2405 # CHECK: Iterations: 100
2406 # CHECK-NEXT: Instructions: 1000
2407 # CHECK-NEXT: Total Cycles: 1210
2408 # CHECK-NEXT: Total uOps: 3600
2410 # CHECK: Dispatch Width: 3
2411 # CHECK-NEXT: uOps Per Cycle: 2.98
2412 # CHECK-NEXT: IPC: 0.83
2413 # CHECK-NEXT: Block RThroughput: 12.0
2415 # CHECK: Timeline view:
2416 # CHECK-NEXT: 0123456789
2417 # CHECK-NEXT: Index 0123456789 01
2419 # CHECK: [0,0] DeeeeeeeeeER . .. ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24
2420 # CHECK-NEXT: [0,1] .DeE-------R . .. add x0, x27, #1
2421 # CHECK-NEXT: [0,2] . DeeeeeeeeeER . .. ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24
2422 # CHECK-NEXT: [0,3] . DeE-------R . .. add x0, x27, #1
2423 # CHECK-NEXT: [0,4] . DeeeeeeeeeeER .. ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48
2424 # CHECK-NEXT: [0,5] . .DeE-------R .. add x0, x27, #1
2425 # CHECK-NEXT: [0,6] . . DeeeeeeeeeER .. ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24
2426 # CHECK-NEXT: [0,7] . . DeE-------R .. add x0, x27, #1
2427 # CHECK-NEXT: [0,8] . . DeeeeeeeeeeER ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48
2428 # CHECK-NEXT: [0,9] . . .DeE-------R add x0, x27, #1
2430 # CHECK: Average Wait times (based on the timeline view):
2431 # CHECK-NEXT: [0]: Executions
2432 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2433 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2434 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2436 # CHECK: [0] [1] [2] [3]
2437 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24
2438 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2439 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24
2440 # CHECK-NEXT: 3. 1 1.0 0.0 7.0 add x0, x27, #1
2441 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48
2442 # CHECK-NEXT: 5. 1 1.0 1.0 7.0 add x0, x27, #1
2443 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24
2444 # CHECK-NEXT: 7. 1 1.0 0.0 7.0 add x0, x27, #1
2445 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48
2446 # CHECK-NEXT: 9. 1 1.0 1.0 7.0 add x0, x27, #1
2447 # CHECK-NEXT: 1 1.0 0.7 3.5 <total>
2449 # CHECK: [28] Code Region - G29
2451 # CHECK: Iterations: 100
2452 # CHECK-NEXT: Instructions: 1000
2453 # CHECK-NEXT: Total Cycles: 1410
2454 # CHECK-NEXT: Total uOps: 3600
2456 # CHECK: Dispatch Width: 3
2457 # CHECK-NEXT: uOps Per Cycle: 2.55
2458 # CHECK-NEXT: IPC: 0.71
2459 # CHECK-NEXT: Block RThroughput: 14.0
2461 # CHECK: Timeline view:
2462 # CHECK-NEXT: 0123456789
2463 # CHECK-NEXT: Index 0123456789 0123
2465 # CHECK: [0,0] DeeeeeeeeeeER . . . ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48
2466 # CHECK-NEXT: [0,1] . DeE-------R . . . add x0, x27, #1
2467 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . . ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28
2468 # CHECK-NEXT: [0,3] . DeE------R . . . add x0, x27, #1
2469 # CHECK-NEXT: [0,4] . D==eeeeeeeeeER . . ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28
2470 # CHECK-NEXT: [0,5] . .D==eE-------R . . add x0, x27, #1
2471 # CHECK-NEXT: [0,6] . . D==eeeeeeeeeER . ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28
2472 # CHECK-NEXT: [0,7] . . D==eE-------R . add x0, x27, #1
2473 # CHECK-NEXT: [0,8] . . D==eeeeeeeeeeER ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28
2474 # CHECK-NEXT: [0,9] . . .D=eE--------R add x0, x27, #1
2476 # CHECK: Average Wait times (based on the timeline view):
2477 # CHECK-NEXT: [0]: Executions
2478 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2479 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2480 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2482 # CHECK: [0] [1] [2] [3]
2483 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48
2484 # CHECK-NEXT: 1. 1 1.0 1.0 7.0 add x0, x27, #1
2485 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28
2486 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2487 # CHECK-NEXT: 4. 1 3.0 3.0 0.0 ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28
2488 # CHECK-NEXT: 5. 1 3.0 0.0 7.0 add x0, x27, #1
2489 # CHECK-NEXT: 6. 1 3.0 1.0 0.0 ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28
2490 # CHECK-NEXT: 7. 1 3.0 0.0 7.0 add x0, x27, #1
2491 # CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28
2492 # CHECK-NEXT: 9. 1 2.0 0.0 8.0 add x0, x27, #1
2493 # CHECK-NEXT: 1 2.1 0.8 3.5 <total>
2495 # CHECK: [29] Code Region - G30
2497 # CHECK: Iterations: 100
2498 # CHECK-NEXT: Instructions: 1000
2499 # CHECK-NEXT: Total Cycles: 2511
2500 # CHECK-NEXT: Total uOps: 3600
2502 # CHECK: Dispatch Width: 3
2503 # CHECK-NEXT: uOps Per Cycle: 1.43
2504 # CHECK-NEXT: IPC: 0.40
2505 # CHECK-NEXT: Block RThroughput: 12.0
2507 # CHECK: Timeline view:
2508 # CHECK-NEXT: 0123456789 012345
2509 # CHECK-NEXT: Index 0123456789 0123456789
2511 # CHECK: [0,0] DeeeeeeeeeER . . . . . ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28
2512 # CHECK-NEXT: [0,1] .DeE-------R . . . . . add x0, x27, #1
2513 # CHECK-NEXT: [0,2] . DeeeeeeeeeeER. . . . . ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28
2514 # CHECK-NEXT: [0,3] . DeE-------R. . . . . add x0, x27, #1
2515 # CHECK-NEXT: [0,4] . DeeeeeeeeeeER . . . . ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28
2516 # CHECK-NEXT: [0,5] . . DeE-------R . . . . add x0, x27, #1
2517 # CHECK-NEXT: [0,6] . . D=======eeeeeeeeeER . . ld3 { v1.b, v2.b, v3.b }[0], [x27], #3
2518 # CHECK-NEXT: [0,7] . . D=======eE-------R . . add x0, x27, #1
2519 # CHECK-NEXT: [0,8] . . D==============eeeeeeeeeER ld3 { v1.b, v2.b, v3.b }[8], [x27], #3
2520 # CHECK-NEXT: [0,9] . . .D==============eE-------R add x0, x27, #1
2522 # CHECK: Average Wait times (based on the timeline view):
2523 # CHECK-NEXT: [0]: Executions
2524 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2525 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2526 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2528 # CHECK: [0] [1] [2] [3]
2529 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28
2530 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2531 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28
2532 # CHECK-NEXT: 3. 1 1.0 1.0 7.0 add x0, x27, #1
2533 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28
2534 # CHECK-NEXT: 5. 1 1.0 1.0 7.0 add x0, x27, #1
2535 # CHECK-NEXT: 6. 1 8.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[0], [x27], #3
2536 # CHECK-NEXT: 7. 1 8.0 0.0 7.0 add x0, x27, #1
2537 # CHECK-NEXT: 8. 1 15.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[8], [x27], #3
2538 # CHECK-NEXT: 9. 1 15.0 0.0 7.0 add x0, x27, #1
2539 # CHECK-NEXT: 1 5.2 0.5 3.5 <total>
2541 # CHECK: [30] Code Region - G31
2543 # CHECK: Iterations: 100
2544 # CHECK-NEXT: Instructions: 1000
2545 # CHECK-NEXT: Total Cycles: 4503
2546 # CHECK-NEXT: Total uOps: 3000
2548 # CHECK: Dispatch Width: 3
2549 # CHECK-NEXT: uOps Per Cycle: 0.67
2550 # CHECK-NEXT: IPC: 0.22
2551 # CHECK-NEXT: Block RThroughput: 10.0
2553 # CHECK: Timeline view:
2554 # CHECK-NEXT: 0123456789 0123456789
2555 # CHECK-NEXT: Index 0123456789 0123456789 01234567
2557 # CHECK: [0,0] DeeeeeeeeeER . . . . . . . . ld3 { v1.b, v2.b, v3.b }[0], [x27], x28
2558 # CHECK-NEXT: [0,1] .DeE-------R . . . . . . . . add x0, x27, #1
2559 # CHECK-NEXT: [0,2] . D=======eeeeeeeeeER . . . . . . ld3 { v1.b, v2.b, v3.b }[8], [x27], x28
2560 # CHECK-NEXT: [0,3] . D=======eE-------R . . . . . . add x0, x27, #1
2561 # CHECK-NEXT: [0,4] . D==============eeeeeeeeeER. . . . . ld3 { v1.h, v2.h, v3.h }[0], [x27], #6
2562 # CHECK-NEXT: [0,5] . D==============eE-------R. . . . . add x0, x27, #1
2563 # CHECK-NEXT: [0,6] . .D=====================eeeeeeeeeER . . . ld3 { v1.h, v2.h, v3.h }[4], [x27], #6
2564 # CHECK-NEXT: [0,7] . . D=====================eE-------R . . . add x0, x27, #1
2565 # CHECK-NEXT: [0,8] . . D============================eeeeeeeeeER ld3 { v1.h, v2.h, v3.h }[0], [x27], x28
2566 # CHECK-NEXT: [0,9] . . D============================eE-------R add x0, x27, #1
2568 # CHECK: Average Wait times (based on the timeline view):
2569 # CHECK-NEXT: [0]: Executions
2570 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2571 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2572 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2574 # CHECK: [0] [1] [2] [3]
2575 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.b, v2.b, v3.b }[0], [x27], x28
2576 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2577 # CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[8], [x27], x28
2578 # CHECK-NEXT: 3. 1 8.0 0.0 7.0 add x0, x27, #1
2579 # CHECK-NEXT: 4. 1 15.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[0], [x27], #6
2580 # CHECK-NEXT: 5. 1 15.0 0.0 7.0 add x0, x27, #1
2581 # CHECK-NEXT: 6. 1 22.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[4], [x27], #6
2582 # CHECK-NEXT: 7. 1 22.0 0.0 7.0 add x0, x27, #1
2583 # CHECK-NEXT: 8. 1 29.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[0], [x27], x28
2584 # CHECK-NEXT: 9. 1 29.0 0.0 7.0 add x0, x27, #1
2585 # CHECK-NEXT: 1 15.0 0.1 3.5 <total>
2587 # CHECK: [31] Code Region - G32
2589 # CHECK: Iterations: 100
2590 # CHECK-NEXT: Instructions: 1000
2591 # CHECK-NEXT: Total Cycles: 3703
2592 # CHECK-NEXT: Total uOps: 2400
2594 # CHECK: Dispatch Width: 3
2595 # CHECK-NEXT: uOps Per Cycle: 0.65
2596 # CHECK-NEXT: IPC: 0.27
2597 # CHECK-NEXT: Block RThroughput: 8.0
2599 # CHECK: Timeline view:
2600 # CHECK-NEXT: 0123456789 0123456789
2601 # CHECK-NEXT: Index 0123456789 0123456789
2603 # CHECK: [0,0] DeeeeeeeeeER . . . . . . ld3 { v1.h, v2.h, v3.h }[4], [x27], x28
2604 # CHECK-NEXT: [0,1] .DeE-------R . . . . . . add x0, x27, #1
2605 # CHECK-NEXT: [0,2] . D=======eeeeeeeeER. . . . . ld3 { v1.s, v2.s, v3.s }[0], [x27], #12
2606 # CHECK-NEXT: [0,3] . D=======eE------R. . . . . add x0, x27, #1
2607 # CHECK-NEXT: [0,4] . D=============eeeeeeeeER . . . ld3 { v1.s, v2.s, v3.s }[0], [x27], x28
2608 # CHECK-NEXT: [0,5] . D=============eE------R . . . add x0, x27, #1
2609 # CHECK-NEXT: [0,6] . .D===================eeeeeeER . . ld3 { v1.d, v2.d, v3.d }[0], [x27], #24
2610 # CHECK-NEXT: [0,7] . . D===================eE----R . . add x0, x27, #1
2611 # CHECK-NEXT: [0,8] . . D=======================eeeeeeER ld3 { v1.d, v2.d, v3.d }[0], [x27], x28
2612 # CHECK-NEXT: [0,9] . . D=======================eE----R add x0, x27, #1
2614 # CHECK: Average Wait times (based on the timeline view):
2615 # CHECK-NEXT: [0]: Executions
2616 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2617 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2618 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2620 # CHECK: [0] [1] [2] [3]
2621 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.h, v2.h, v3.h }[4], [x27], x28
2622 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2623 # CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld3 { v1.s, v2.s, v3.s }[0], [x27], #12
2624 # CHECK-NEXT: 3. 1 8.0 0.0 6.0 add x0, x27, #1
2625 # CHECK-NEXT: 4. 1 14.0 0.0 0.0 ld3 { v1.s, v2.s, v3.s }[0], [x27], x28
2626 # CHECK-NEXT: 5. 1 14.0 0.0 6.0 add x0, x27, #1
2627 # CHECK-NEXT: 6. 1 20.0 0.0 0.0 ld3 { v1.d, v2.d, v3.d }[0], [x27], #24
2628 # CHECK-NEXT: 7. 1 20.0 0.0 4.0 add x0, x27, #1
2629 # CHECK-NEXT: 8. 1 24.0 0.0 0.0 ld3 { v1.d, v2.d, v3.d }[0], [x27], x28
2630 # CHECK-NEXT: 9. 1 24.0 0.0 4.0 add x0, x27, #1
2631 # CHECK-NEXT: 1 13.4 0.1 2.7 <total>
2633 # CHECK: [32] Code Region - G33
2635 # CHECK: Iterations: 100
2636 # CHECK-NEXT: Instructions: 1000
2637 # CHECK-NEXT: Total Cycles: 1110
2638 # CHECK-NEXT: Total uOps: 2700
2640 # CHECK: Dispatch Width: 3
2641 # CHECK-NEXT: uOps Per Cycle: 2.43
2642 # CHECK-NEXT: IPC: 0.90
2643 # CHECK-NEXT: Block RThroughput: 9.0
2645 # CHECK: Timeline view:
2646 # CHECK-NEXT: 0123456789
2647 # CHECK-NEXT: Index 0123456789 0
2649 # CHECK: [0,0] DeeeeeeER . . . ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24
2650 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
2651 # CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24
2652 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2653 # CHECK-NEXT: [0,4] . DeeeeeeeeER . ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12
2654 # CHECK-NEXT: [0,5] . .DeE------R . add x0, x27, #1
2655 # CHECK-NEXT: [0,6] . . DeeeeeeeeER . ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6
2656 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
2657 # CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12
2658 # CHECK-NEXT: [0,9] . . DeE-------R add x0, x27, #1
2660 # CHECK: Average Wait times (based on the timeline view):
2661 # CHECK-NEXT: [0]: Executions
2662 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2663 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2664 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2666 # CHECK: [0] [1] [2] [3]
2667 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24
2668 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
2669 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24
2670 # CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1
2671 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12
2672 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
2673 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6
2674 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2675 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12
2676 # CHECK-NEXT: 9. 1 1.0 0.0 7.0 add x0, x27, #1
2677 # CHECK-NEXT: 1 1.0 0.6 2.9 <total>
2679 # CHECK: [33] Code Region - G34
2681 # CHECK: Iterations: 100
2682 # CHECK-NEXT: Instructions: 1000
2683 # CHECK-NEXT: Total Cycles: 1109
2684 # CHECK-NEXT: Total uOps: 2800
2686 # CHECK: Dispatch Width: 3
2687 # CHECK-NEXT: uOps Per Cycle: 2.52
2688 # CHECK-NEXT: IPC: 0.90
2689 # CHECK-NEXT: Block RThroughput: 9.3
2691 # CHECK: Timeline view:
2692 # CHECK-NEXT: 0123456789
2693 # CHECK-NEXT: Index 0123456789
2695 # CHECK: [0,0] DeeeeeeeeER . . ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3
2696 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2697 # CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6
2698 # CHECK-NEXT: [0,3] . DeE-------R . . add x0, x27, #1
2699 # CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3
2700 # CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1
2701 # CHECK-NEXT: [0,6] . .DeeeeeeE-R . ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28
2702 # CHECK-NEXT: [0,7] . . DeE-----R . add x0, x27, #1
2703 # CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28
2704 # CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1
2706 # CHECK: Average Wait times (based on the timeline view):
2707 # CHECK-NEXT: [0]: Executions
2708 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2709 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2710 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2712 # CHECK: [0] [1] [2] [3]
2713 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3
2714 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2715 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6
2716 # CHECK-NEXT: 3. 1 1.0 0.0 7.0 add x0, x27, #1
2717 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3
2718 # CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1
2719 # CHECK-NEXT: 6. 1 1.0 1.0 1.0 ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28
2720 # CHECK-NEXT: 7. 1 1.0 0.0 5.0 add x0, x27, #1
2721 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28
2722 # CHECK-NEXT: 9. 1 1.0 1.0 6.0 add x0, x27, #1
2723 # CHECK-NEXT: 1 1.0 0.6 3.2 <total>
2725 # CHECK: [34] Code Region - G35
2727 # CHECK: Iterations: 100
2728 # CHECK-NEXT: Instructions: 1000
2729 # CHECK-NEXT: Total Cycles: 1010
2730 # CHECK-NEXT: Total uOps: 2700
2732 # CHECK: Dispatch Width: 3
2733 # CHECK-NEXT: uOps Per Cycle: 2.67
2734 # CHECK-NEXT: IPC: 0.99
2735 # CHECK-NEXT: Block RThroughput: 9.0
2737 # CHECK: Timeline view:
2738 # CHECK-NEXT: 0123456789
2739 # CHECK-NEXT: Index 0123456789
2741 # CHECK: [0,0] DeeeeeeeeER . . ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28
2742 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
2743 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28
2744 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
2745 # CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28
2746 # CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1
2747 # CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28
2748 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
2749 # CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28
2750 # CHECK-NEXT: [0,9] . . DeE-------R add x0, x27, #1
2752 # CHECK: Average Wait times (based on the timeline view):
2753 # CHECK-NEXT: [0]: Executions
2754 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2755 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2756 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2758 # CHECK: [0] [1] [2] [3]
2759 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28
2760 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
2761 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28
2762 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2763 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28
2764 # CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1
2765 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28
2766 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2767 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28
2768 # CHECK-NEXT: 9. 1 1.0 0.0 7.0 add x0, x27, #1
2769 # CHECK-NEXT: 1 1.0 0.5 3.2 <total>
2771 # CHECK: [35] Code Region - G36
2773 # CHECK: Iterations: 100
2774 # CHECK-NEXT: Instructions: 1000
2775 # CHECK-NEXT: Total Cycles: 1311
2776 # CHECK-NEXT: Total uOps: 3400
2778 # CHECK: Dispatch Width: 3
2779 # CHECK-NEXT: uOps Per Cycle: 2.59
2780 # CHECK-NEXT: IPC: 0.76
2781 # CHECK-NEXT: Block RThroughput: 13.0
2783 # CHECK: Timeline view:
2784 # CHECK-NEXT: 0123456789
2785 # CHECK-NEXT: Index 0123456789 0123
2787 # CHECK: [0,0] DeeeeeeeeeER . . . ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28
2788 # CHECK-NEXT: [0,1] .DeE-------R . . . add x0, x27, #1
2789 # CHECK-NEXT: [0,2] . DeeeeeeeeER . . . ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2790 # CHECK-NEXT: [0,3] . DeE------R . . . add x0, x27, #1
2791 # CHECK-NEXT: [0,4] . D==eeeeeeeeeER . . ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2792 # CHECK-NEXT: [0,5] . D==eE-------R . . add x0, x27, #1
2793 # CHECK-NEXT: [0,6] . .D==eeeeeeeeeER. . ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2794 # CHECK-NEXT: [0,7] . . D==eE-------R. . add x0, x27, #1
2795 # CHECK-NEXT: [0,8] . . D==eeeeeeeeeeeER ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2796 # CHECK-NEXT: [0,9] . . .DeE---------R add x0, x27, #1
2798 # CHECK: Average Wait times (based on the timeline view):
2799 # CHECK-NEXT: [0]: Executions
2800 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2801 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2802 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2804 # CHECK: [0] [1] [2] [3]
2805 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28
2806 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2807 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2808 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
2809 # CHECK-NEXT: 4. 1 3.0 3.0 0.0 ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2810 # CHECK-NEXT: 5. 1 3.0 0.0 7.0 add x0, x27, #1
2811 # CHECK-NEXT: 6. 1 3.0 1.0 0.0 ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2812 # CHECK-NEXT: 7. 1 3.0 0.0 7.0 add x0, x27, #1
2813 # CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2814 # CHECK-NEXT: 9. 1 1.0 0.0 9.0 add x0, x27, #1
2815 # CHECK-NEXT: 1 2.0 0.7 3.6 <total>
2817 # CHECK: [36] Code Region - G37
2819 # CHECK: Iterations: 100
2820 # CHECK-NEXT: Instructions: 1000
2821 # CHECK-NEXT: Total Cycles: 1610
2822 # CHECK-NEXT: Total uOps: 3800
2824 # CHECK: Dispatch Width: 3
2825 # CHECK-NEXT: uOps Per Cycle: 2.36
2826 # CHECK-NEXT: IPC: 0.62
2827 # CHECK-NEXT: Block RThroughput: 16.0
2829 # CHECK: Timeline view:
2830 # CHECK-NEXT: 0123456789
2831 # CHECK-NEXT: Index 0123456789 012345
2833 # CHECK: [0,0] DeeeeeeeeeER . . . ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2834 # CHECK-NEXT: [0,1] .DeE-------R . . . add x0, x27, #1
2835 # CHECK-NEXT: [0,2] . DeeeeeeeeeeeER . . ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2836 # CHECK-NEXT: [0,3] . DeE-------R . . add x0, x27, #1
2837 # CHECK-NEXT: [0,4] . .DeeeeeeeeeeeER. . ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2838 # CHECK-NEXT: [0,5] . . DeE-------R. . add x0, x27, #1
2839 # CHECK-NEXT: [0,6] . . DeeeeeeeeER . ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2840 # CHECK-NEXT: [0,7] . . .DeE------R . add x0, x27, #1
2841 # CHECK-NEXT: [0,8] . . . D==eeeeeeeeeER ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2842 # CHECK-NEXT: [0,9] . . . D==eE-------R add x0, x27, #1
2844 # CHECK: Average Wait times (based on the timeline view):
2845 # CHECK-NEXT: [0]: Executions
2846 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2847 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2848 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2850 # CHECK: [0] [1] [2] [3]
2851 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2852 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2853 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2854 # CHECK-NEXT: 3. 1 1.0 1.0 7.0 add x0, x27, #1
2855 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2856 # CHECK-NEXT: 5. 1 1.0 1.0 7.0 add x0, x27, #1
2857 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2858 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
2859 # CHECK-NEXT: 8. 1 3.0 3.0 0.0 ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2860 # CHECK-NEXT: 9. 1 3.0 0.0 7.0 add x0, x27, #1
2861 # CHECK-NEXT: 1 1.4 0.9 3.4 <total>
2863 # CHECK: [37] Code Region - G38
2865 # CHECK: Iterations: 100
2866 # CHECK-NEXT: Instructions: 1000
2867 # CHECK-NEXT: Total Cycles: 1610
2868 # CHECK-NEXT: Total uOps: 4200
2870 # CHECK: Dispatch Width: 3
2871 # CHECK-NEXT: uOps Per Cycle: 2.61
2872 # CHECK-NEXT: IPC: 0.62
2873 # CHECK-NEXT: Block RThroughput: 16.0
2875 # CHECK: Timeline view:
2876 # CHECK-NEXT: 0123456789
2877 # CHECK-NEXT: Index 0123456789 012345
2879 # CHECK: [0,0] DeeeeeeeeeER . . . ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2880 # CHECK-NEXT: [0,1] .DeE-------R . . . add x0, x27, #1
2881 # CHECK-NEXT: [0,2] . DeeeeeeeeeeeER . . ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2882 # CHECK-NEXT: [0,3] . DeE-------R . . add x0, x27, #1
2883 # CHECK-NEXT: [0,4] . .DeeeeeeeeeER . . ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2884 # CHECK-NEXT: [0,5] . . DeE-------R . . add x0, x27, #1
2885 # CHECK-NEXT: [0,6] . . DeeeeeeeeeeeER . ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2886 # CHECK-NEXT: [0,7] . . .DeE-------R . add x0, x27, #1
2887 # CHECK-NEXT: [0,8] . . . DeeeeeeeeeeeER ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2888 # CHECK-NEXT: [0,9] . . . DeE-------R add x0, x27, #1
2890 # CHECK: Average Wait times (based on the timeline view):
2891 # CHECK-NEXT: [0]: Executions
2892 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2893 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2894 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2896 # CHECK: [0] [1] [2] [3]
2897 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2898 # CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1
2899 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2900 # CHECK-NEXT: 3. 1 1.0 1.0 7.0 add x0, x27, #1
2901 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2902 # CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1
2903 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2904 # CHECK-NEXT: 7. 1 1.0 1.0 7.0 add x0, x27, #1
2905 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2906 # CHECK-NEXT: 9. 1 1.0 1.0 7.0 add x0, x27, #1
2907 # CHECK-NEXT: 1 1.0 0.8 3.5 <total>
2909 # CHECK: [38] Code Region - G39
2911 # CHECK: Iterations: 100
2912 # CHECK-NEXT: Instructions: 1000
2913 # CHECK-NEXT: Total Cycles: 4503
2914 # CHECK-NEXT: Total uOps: 3500
2916 # CHECK: Dispatch Width: 3
2917 # CHECK-NEXT: uOps Per Cycle: 0.78
2918 # CHECK-NEXT: IPC: 0.22
2919 # CHECK-NEXT: Block RThroughput: 11.7
2921 # CHECK: Timeline view:
2922 # CHECK-NEXT: 0123456789 0123456789
2923 # CHECK-NEXT: Index 0123456789 0123456789 01234567
2925 # CHECK: [0,0] DeeeeeeeeeER . . . . . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
2926 # CHECK-NEXT: [0,1] . DeE------R . . . . . . . . add x0, x27, #1
2927 # CHECK-NEXT: [0,2] . D======eeeeeeeeeER . . . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
2928 # CHECK-NEXT: [0,3] . D=====eE-------R . . . . . . add x0, x27, #1
2929 # CHECK-NEXT: [0,4] . .D============eeeeeeeeeER. . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
2930 # CHECK-NEXT: [0,5] . . D===========eE-------R. . . . . add x0, x27, #1
2931 # CHECK-NEXT: [0,6] . . D==================eeeeeeeeeER . . . ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
2932 # CHECK-NEXT: [0,7] . . .D=================eE-------R . . . add x0, x27, #1
2933 # CHECK-NEXT: [0,8] . . . D========================eeeeeeeeeER ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
2934 # CHECK-NEXT: [0,9] . . . D=======================eE-------R add x0, x27, #1
2936 # CHECK: Average Wait times (based on the timeline view):
2937 # CHECK-NEXT: [0]: Executions
2938 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2939 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2940 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2942 # CHECK: [0] [1] [2] [3]
2943 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
2944 # CHECK-NEXT: 1. 1 1.0 1.0 6.0 add x0, x27, #1
2945 # CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
2946 # CHECK-NEXT: 3. 1 6.0 0.0 7.0 add x0, x27, #1
2947 # CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
2948 # CHECK-NEXT: 5. 1 12.0 0.0 7.0 add x0, x27, #1
2949 # CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
2950 # CHECK-NEXT: 7. 1 18.0 0.0 7.0 add x0, x27, #1
2951 # CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
2952 # CHECK-NEXT: 9. 1 24.0 0.0 7.0 add x0, x27, #1
2953 # CHECK-NEXT: 1 12.6 0.2 3.4 <total>
2955 # CHECK: [39] Code Region - G40
2957 # CHECK: Iterations: 100
2958 # CHECK-NEXT: Instructions: 1000
2959 # CHECK-NEXT: Total Cycles: 4303
2960 # CHECK-NEXT: Total uOps: 3100
2962 # CHECK: Dispatch Width: 3
2963 # CHECK-NEXT: uOps Per Cycle: 0.72
2964 # CHECK-NEXT: IPC: 0.23
2965 # CHECK-NEXT: Block RThroughput: 10.3
2967 # CHECK: Timeline view:
2968 # CHECK-NEXT: 0123456789 0123456789
2969 # CHECK-NEXT: Index 0123456789 0123456789 012345
2971 # CHECK: [0,0] DeeeeeeeeeER . . . . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
2972 # CHECK-NEXT: [0,1] . DeE------R . . . . . . . add x0, x27, #1
2973 # CHECK-NEXT: [0,2] . D======eeeeeeeeeER . . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
2974 # CHECK-NEXT: [0,3] . D=====eE-------R . . . . . add x0, x27, #1
2975 # CHECK-NEXT: [0,4] . .D============eeeeeeeeeER. . . . ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
2976 # CHECK-NEXT: [0,5] . . D===========eE-------R. . . . add x0, x27, #1
2977 # CHECK-NEXT: [0,6] . . D==================eeeeeeeeER . . ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
2978 # CHECK-NEXT: [0,7] . . D==================eE------R . . add x0, x27, #1
2979 # CHECK-NEXT: [0,8] . . .D========================eeeeeeeeER ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
2980 # CHECK-NEXT: [0,9] . . . D========================eE------R add x0, x27, #1
2982 # CHECK: Average Wait times (based on the timeline view):
2983 # CHECK-NEXT: [0]: Executions
2984 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2985 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2986 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2988 # CHECK: [0] [1] [2] [3]
2989 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
2990 # CHECK-NEXT: 1. 1 1.0 1.0 6.0 add x0, x27, #1
2991 # CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
2992 # CHECK-NEXT: 3. 1 6.0 0.0 7.0 add x0, x27, #1
2993 # CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
2994 # CHECK-NEXT: 5. 1 12.0 0.0 7.0 add x0, x27, #1
2995 # CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
2996 # CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1
2997 # CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
2998 # CHECK-NEXT: 9. 1 25.0 0.0 6.0 add x0, x27, #1
2999 # CHECK-NEXT: 1 12.8 0.2 3.2 <total>
3001 # CHECK: [40] Code Region - G41
3003 # CHECK: Iterations: 100
3004 # CHECK-NEXT: Instructions: 1000
3005 # CHECK-NEXT: Total Cycles: 2303
3006 # CHECK-NEXT: Total uOps: 3100
3008 # CHECK: Dispatch Width: 3
3009 # CHECK-NEXT: uOps Per Cycle: 1.35
3010 # CHECK-NEXT: IPC: 0.43
3011 # CHECK-NEXT: Block RThroughput: 10.3
3013 # CHECK: Timeline view:
3014 # CHECK-NEXT: 0123456789
3015 # CHECK-NEXT: Index 0123456789 012345
3017 # CHECK: [0,0] DeeeeeeeeeER . . . ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
3018 # CHECK-NEXT: [0,1] . DeE------R . . . add x0, x27, #1
3019 # CHECK-NEXT: [0,2] . D======eeeeeeeeeER . ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
3020 # CHECK-NEXT: [0,3] . D=====eE-------R . add x0, x27, #1
3021 # CHECK-NEXT: [0,4] . .D=====eeeeeeE-R . ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
3022 # CHECK-NEXT: [0,5] . . D=====eE-----R . add x0, x27, #1
3023 # CHECK-NEXT: [0,6] . . D=====eeeeeeeeeER. ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
3024 # CHECK-NEXT: [0,7] . . D====eE-------R. add x0, x27, #1
3025 # CHECK-NEXT: [0,8] . . .D====eeeeeeeeER ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
3026 # CHECK-NEXT: [0,9] . . . D====eE------R add x0, x27, #1
3028 # CHECK: Average Wait times (based on the timeline view):
3029 # CHECK-NEXT: [0]: Executions
3030 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3031 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3032 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3034 # CHECK: [0] [1] [2] [3]
3035 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
3036 # CHECK-NEXT: 1. 1 1.0 1.0 6.0 add x0, x27, #1
3037 # CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
3038 # CHECK-NEXT: 3. 1 6.0 0.0 7.0 add x0, x27, #1
3039 # CHECK-NEXT: 4. 1 6.0 1.0 1.0 ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
3040 # CHECK-NEXT: 5. 1 6.0 0.0 5.0 add x0, x27, #1
3041 # CHECK-NEXT: 6. 1 6.0 1.0 0.0 ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
3042 # CHECK-NEXT: 7. 1 5.0 0.0 7.0 add x0, x27, #1
3043 # CHECK-NEXT: 8. 1 5.0 1.0 0.0 ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
3044 # CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1
3045 # CHECK-NEXT: 1 4.8 0.5 3.2 <total>
3047 # CHECK: [41] Code Region - G42
3049 # CHECK: Iterations: 100
3050 # CHECK-NEXT: Instructions: 1000
3051 # CHECK-NEXT: Total Cycles: 1309
3052 # CHECK-NEXT: Total uOps: 3100
3054 # CHECK: Dispatch Width: 3
3055 # CHECK-NEXT: uOps Per Cycle: 2.37
3056 # CHECK-NEXT: IPC: 0.76
3057 # CHECK-NEXT: Block RThroughput: 10.3
3059 # CHECK: Timeline view:
3060 # CHECK-NEXT: 0123456789
3061 # CHECK-NEXT: Index 0123456789 01
3063 # CHECK: [0,0] DeeeeeeeeER . .. ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
3064 # CHECK-NEXT: [0,1] .DeE------R . .. add x0, x27, #1
3065 # CHECK-NEXT: [0,2] . DeeeeeeeeeER . .. ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
3066 # CHECK-NEXT: [0,3] . DeE------R . .. add x0, x27, #1
3067 # CHECK-NEXT: [0,4] . DeeeeeeeeER .. ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
3068 # CHECK-NEXT: [0,5] . .DeE------R .. add x0, x27, #1
3069 # CHECK-NEXT: [0,6] . . DeeeeeeeeeER .. ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
3070 # CHECK-NEXT: [0,7] . . DeE------R .. add x0, x27, #1
3071 # CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
3072 # CHECK-NEXT: [0,9] . . . DeE------R add x0, x27, #1
3074 # CHECK: Average Wait times (based on the timeline view):
3075 # CHECK-NEXT: [0]: Executions
3076 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3077 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3078 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3080 # CHECK: [0] [1] [2] [3]
3081 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
3082 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
3083 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
3084 # CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1
3085 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
3086 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
3087 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
3088 # CHECK-NEXT: 7. 1 1.0 1.0 6.0 add x0, x27, #1
3089 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
3090 # CHECK-NEXT: 9. 1 1.0 1.0 6.0 add x0, x27, #1
3091 # CHECK-NEXT: 1 1.0 0.8 3.0 <total>
3093 # CHECK: [42] Code Region - G43
3095 # CHECK: Iterations: 100
3096 # CHECK-NEXT: Instructions: 1000
3097 # CHECK-NEXT: Total Cycles: 1209
3098 # CHECK-NEXT: Total uOps: 2900
3100 # CHECK: Dispatch Width: 3
3101 # CHECK-NEXT: uOps Per Cycle: 2.40
3102 # CHECK-NEXT: IPC: 0.83
3103 # CHECK-NEXT: Block RThroughput: 9.7
3105 # CHECK: Timeline view:
3106 # CHECK-NEXT: 0123456789
3107 # CHECK-NEXT: Index 0123456789 0
3109 # CHECK: [0,0] DeeeeeeER . . . ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
3110 # CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1
3111 # CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3112 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
3113 # CHECK-NEXT: [0,4] . DeeeeeeeeER . ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3114 # CHECK-NEXT: [0,5] . .DeE------R . add x0, x27, #1
3115 # CHECK-NEXT: [0,6] . . DeeeeeeeeER . ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3116 # CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1
3117 # CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3118 # CHECK-NEXT: [0,9] . . .DeE------R add x0, x27, #1
3120 # CHECK: Average Wait times (based on the timeline view):
3121 # CHECK-NEXT: [0]: Executions
3122 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3123 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3124 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3126 # CHECK: [0] [1] [2] [3]
3127 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
3128 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
3129 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3130 # CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1
3131 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3132 # CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1
3133 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3134 # CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1
3135 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3136 # CHECK-NEXT: 9. 1 1.0 1.0 6.0 add x0, x27, #1
3137 # CHECK-NEXT: 1 1.0 0.7 2.8 <total>
3139 # CHECK: [43] Code Region - G44
3141 # CHECK: Iterations: 100
3142 # CHECK-NEXT: Instructions: 1000
3143 # CHECK-NEXT: Total Cycles: 1206
3144 # CHECK-NEXT: Total uOps: 2700
3146 # CHECK: Dispatch Width: 3
3147 # CHECK-NEXT: uOps Per Cycle: 2.24
3148 # CHECK-NEXT: IPC: 0.83
3149 # CHECK-NEXT: Block RThroughput: 9.0
3151 # CHECK: Timeline view:
3152 # CHECK-NEXT: 01234567
3153 # CHECK-NEXT: Index 0123456789
3155 # CHECK: [0,0] DeeeeeeeeER . . ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3156 # CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1
3157 # CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3158 # CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1
3159 # CHECK-NEXT: [0,4] . DeeeeeeeeeER. ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3160 # CHECK-NEXT: [0,5] . . DeE------R. add x0, x27, #1
3161 # CHECK-NEXT: [0,6] . . DeeeeeE-R. ldp s1, s2, [x27], #248
3162 # CHECK-NEXT: [0,7] . . DeE----R. add x0, x27, #1
3163 # CHECK-NEXT: [0,8] . . DeeeeeER ldp d1, d2, [x27], #496
3164 # CHECK-NEXT: [0,9] . . .DeE---R add x0, x27, #1
3166 # CHECK: Average Wait times (based on the timeline view):
3167 # CHECK-NEXT: [0]: Executions
3168 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3169 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3170 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3172 # CHECK: [0] [1] [2] [3]
3173 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3174 # CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1
3175 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3176 # CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1
3177 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3178 # CHECK-NEXT: 5. 1 1.0 1.0 6.0 add x0, x27, #1
3179 # CHECK-NEXT: 6. 1 1.0 1.0 1.0 ldp s1, s2, [x27], #248
3180 # CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1
3181 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ldp d1, d2, [x27], #496
3182 # CHECK-NEXT: 9. 1 1.0 0.0 3.0 add x0, x27, #1
3183 # CHECK-NEXT: 1 1.0 0.7 2.6 <total>
3185 # CHECK: [44] Code Region - G45
3187 # CHECK: Iterations: 100
3188 # CHECK-NEXT: Instructions: 1000
3189 # CHECK-NEXT: Total Cycles: 1005
3190 # CHECK-NEXT: Total uOps: 2200
3192 # CHECK: Dispatch Width: 3
3193 # CHECK-NEXT: uOps Per Cycle: 2.19
3194 # CHECK-NEXT: IPC: 1.00
3195 # CHECK-NEXT: Block RThroughput: 7.3
3197 # CHECK: Timeline view:
3199 # CHECK-NEXT: Index 0123456789
3201 # CHECK: [0,0] DeeeeeeER . . ldp q1, q2, [x27], #992
3202 # CHECK-NEXT: [0,1] .DeE----R . . add x0, x27, #1
3203 # CHECK-NEXT: [0,2] . DeeeeeER. . ldp s1, s2, [x27, #248]!
3204 # CHECK-NEXT: [0,3] . DeE---R. . add x0, x27, #1
3205 # CHECK-NEXT: [0,4] . DeeeeeER . ldp d1, d2, [x27, #496]!
3206 # CHECK-NEXT: [0,5] . DeE---R . add x0, x27, #1
3207 # CHECK-NEXT: [0,6] . .DeeeeeeER ldp q1, q2, [x27, #992]!
3208 # CHECK-NEXT: [0,7] . . DeE----R add x0, x27, #1
3209 # CHECK-NEXT: [0,8] . . DeeeeER ldp w1, w2, [x27], #248
3210 # CHECK-NEXT: [0,9] . . DeE--R add x0, x27, #1
3212 # CHECK: Average Wait times (based on the timeline view):
3213 # CHECK-NEXT: [0]: Executions
3214 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3215 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3216 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3218 # CHECK: [0] [1] [2] [3]
3219 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldp q1, q2, [x27], #992
3220 # CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1
3221 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ldp s1, s2, [x27, #248]!
3222 # CHECK-NEXT: 3. 1 1.0 0.0 3.0 add x0, x27, #1
3223 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ldp d1, d2, [x27, #496]!
3224 # CHECK-NEXT: 5. 1 1.0 0.0 3.0 add x0, x27, #1
3225 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ldp q1, q2, [x27, #992]!
3226 # CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1
3227 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ldp w1, w2, [x27], #248
3228 # CHECK-NEXT: 9. 1 1.0 0.0 2.0 add x0, x27, #1
3229 # CHECK-NEXT: 1 1.0 0.5 1.6 <total>
3231 # CHECK: [45] Code Region - G46
3233 # CHECK: Iterations: 100
3234 # CHECK-NEXT: Instructions: 1000
3235 # CHECK-NEXT: Total Cycles: 1006
3236 # CHECK-NEXT: Total uOps: 2400
3238 # CHECK: Dispatch Width: 3
3239 # CHECK-NEXT: uOps Per Cycle: 2.39
3240 # CHECK-NEXT: IPC: 0.99
3241 # CHECK-NEXT: Block RThroughput: 8.0
3243 # CHECK: Timeline view:
3244 # CHECK-NEXT: 012345
3245 # CHECK-NEXT: Index 0123456789
3247 # CHECK: [0,0] DeeeeER . . ldp x1, x2, [x27], #496
3248 # CHECK-NEXT: [0,1] .DeE--R . . add x0, x27, #1
3249 # CHECK-NEXT: [0,2] . DeeeeER . . ldp w1, w2, [x27, #248]!
3250 # CHECK-NEXT: [0,3] . DeE--R . . add x0, x27, #1
3251 # CHECK-NEXT: [0,4] . DeeeeER . ldp x1, x2, [x27, #496]!
3252 # CHECK-NEXT: [0,5] . DeE--R . add x0, x27, #1
3253 # CHECK-NEXT: [0,6] . .DeeeeeER . ldpsw x1, x2, [x27], #248
3254 # CHECK-NEXT: [0,7] . . DeE---R . add x0, x27, #1
3255 # CHECK-NEXT: [0,8] . . DeeeeeER ldpsw x1, x2, [x27, #248]!
3256 # CHECK-NEXT: [0,9] . . DeE---R add x0, x27, #1
3258 # CHECK: Average Wait times (based on the timeline view):
3259 # CHECK-NEXT: [0]: Executions
3260 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3261 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3262 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3264 # CHECK: [0] [1] [2] [3]
3265 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldp x1, x2, [x27], #496
3266 # CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1
3267 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 ldp w1, w2, [x27, #248]!
3268 # CHECK-NEXT: 3. 1 1.0 0.0 2.0 add x0, x27, #1
3269 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 ldp x1, x2, [x27, #496]!
3270 # CHECK-NEXT: 5. 1 1.0 0.0 2.0 add x0, x27, #1
3271 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 ldpsw x1, x2, [x27], #248
3272 # CHECK-NEXT: 7. 1 1.0 0.0 3.0 add x0, x27, #1
3273 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 ldpsw x1, x2, [x27, #248]!
3274 # CHECK-NEXT: 9. 1 1.0 0.0 3.0 add x0, x27, #1
3275 # CHECK-NEXT: 1 1.0 0.5 1.2 <total>
3277 # CHECK: [46] Code Region - G47
3279 # CHECK: Iterations: 100
3280 # CHECK-NEXT: Instructions: 1000
3281 # CHECK-NEXT: Total Cycles: 2504
3282 # CHECK-NEXT: Total uOps: 1500
3284 # CHECK: Dispatch Width: 3
3285 # CHECK-NEXT: uOps Per Cycle: 0.60
3286 # CHECK-NEXT: IPC: 0.40
3287 # CHECK-NEXT: Block RThroughput: 5.0
3289 # CHECK: Timeline view:
3290 # CHECK-NEXT: 0123456789
3291 # CHECK-NEXT: Index 0123456789 012345678
3293 # CHECK: [0,0] DeeeeeER . . . . . ldr b1, [x27], #254
3294 # CHECK-NEXT: [0,1] D=====eER . . . . . add x0, x27, #1
3295 # CHECK-NEXT: [0,2] .D====eeeeeER . . . . ldr h1, [x27], #254
3296 # CHECK-NEXT: [0,3] .D=========eER . . . . add x0, x27, #1
3297 # CHECK-NEXT: [0,4] . D========eeeeeER . . . ldr s1, [x27], #254
3298 # CHECK-NEXT: [0,5] . D=============eER . . . add x0, x27, #1
3299 # CHECK-NEXT: [0,6] . D============eeeeeER . . ldr d1, [x27], #254
3300 # CHECK-NEXT: [0,7] . D=================eER . . add x0, x27, #1
3301 # CHECK-NEXT: [0,8] . D================eeeeeER. ldr q1, [x27], #254
3302 # CHECK-NEXT: [0,9] . D=====================eER add x0, x27, #1
3304 # CHECK: Average Wait times (based on the timeline view):
3305 # CHECK-NEXT: [0]: Executions
3306 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3307 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3308 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3310 # CHECK: [0] [1] [2] [3]
3311 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr b1, [x27], #254
3312 # CHECK-NEXT: 1. 1 6.0 0.0 0.0 add x0, x27, #1
3313 # CHECK-NEXT: 2. 1 5.0 0.0 0.0 ldr h1, [x27], #254
3314 # CHECK-NEXT: 3. 1 10.0 0.0 0.0 add x0, x27, #1
3315 # CHECK-NEXT: 4. 1 9.0 0.0 0.0 ldr s1, [x27], #254
3316 # CHECK-NEXT: 5. 1 14.0 0.0 0.0 add x0, x27, #1
3317 # CHECK-NEXT: 6. 1 13.0 0.0 0.0 ldr d1, [x27], #254
3318 # CHECK-NEXT: 7. 1 18.0 0.0 0.0 add x0, x27, #1
3319 # CHECK-NEXT: 8. 1 17.0 0.0 0.0 ldr q1, [x27], #254
3320 # CHECK-NEXT: 9. 1 22.0 0.0 0.0 add x0, x27, #1
3321 # CHECK-NEXT: 1 11.5 0.1 0.0 <total>
3323 # CHECK: [47] Code Region - G48
3325 # CHECK: Iterations: 100
3326 # CHECK-NEXT: Instructions: 1000
3327 # CHECK-NEXT: Total Cycles: 507
3328 # CHECK-NEXT: Total uOps: 1500
3330 # CHECK: Dispatch Width: 3
3331 # CHECK-NEXT: uOps Per Cycle: 2.96
3332 # CHECK-NEXT: IPC: 1.97
3333 # CHECK-NEXT: Block RThroughput: 5.0
3335 # CHECK: Timeline view:
3337 # CHECK-NEXT: Index 0123456789
3339 # CHECK: [0,0] DeeeeeER .. ldr b1, [x27, #254]!
3340 # CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1
3341 # CHECK-NEXT: [0,2] .DeeeeeER .. ldr h1, [x27, #254]!
3342 # CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1
3343 # CHECK-NEXT: [0,4] . DeeeeeER.. ldr s1, [x27, #254]!
3344 # CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1
3345 # CHECK-NEXT: [0,6] . DeeeeeER. ldr d1, [x27, #254]!
3346 # CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1
3347 # CHECK-NEXT: [0,8] . DeeeeeER ldr q1, [x27, #254]!
3348 # CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1
3350 # CHECK: Average Wait times (based on the timeline view):
3351 # CHECK-NEXT: [0]: Executions
3352 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3353 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3354 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3356 # CHECK: [0] [1] [2] [3]
3357 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr b1, [x27, #254]!
3358 # CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1
3359 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldr h1, [x27, #254]!
3360 # CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1
3361 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldr s1, [x27, #254]!
3362 # CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1
3363 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldr d1, [x27, #254]!
3364 # CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1
3365 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldr q1, [x27, #254]!
3366 # CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1
3367 # CHECK-NEXT: 1 1.5 0.1 1.5 <total>
3369 # CHECK: [48] Code Region - G49
3371 # CHECK: Iterations: 100
3372 # CHECK-NEXT: Instructions: 1000
3373 # CHECK-NEXT: Total Cycles: 506
3374 # CHECK-NEXT: Total uOps: 1500
3376 # CHECK: Dispatch Width: 3
3377 # CHECK-NEXT: uOps Per Cycle: 2.96
3378 # CHECK-NEXT: IPC: 1.98
3379 # CHECK-NEXT: Block RThroughput: 5.0
3381 # CHECK: Timeline view:
3383 # CHECK-NEXT: Index 0123456789
3385 # CHECK: [0,0] DeeeeER . ldr w1, [x27], #254
3386 # CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1
3387 # CHECK-NEXT: [0,2] .DeeeeER . ldr x1, [x27], #254
3388 # CHECK-NEXT: [0,3] .D=eE--R . add x0, x27, #1
3389 # CHECK-NEXT: [0,4] . DeeeeER . ldr w1, [x27, #254]!
3390 # CHECK-NEXT: [0,5] . D=eE--R . add x0, x27, #1
3391 # CHECK-NEXT: [0,6] . DeeeeER. ldr x1, [x27, #254]!
3392 # CHECK-NEXT: [0,7] . D=eE--R. add x0, x27, #1
3393 # CHECK-NEXT: [0,8] . DeeeeER ldrb w1, [x27], #254
3394 # CHECK-NEXT: [0,9] . D=eE--R add x0, x27, #1
3396 # CHECK: Average Wait times (based on the timeline view):
3397 # CHECK-NEXT: [0]: Executions
3398 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3399 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3400 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3402 # CHECK: [0] [1] [2] [3]
3403 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr w1, [x27], #254
3404 # CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1
3405 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldr x1, [x27], #254
3406 # CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1
3407 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldr w1, [x27, #254]!
3408 # CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1
3409 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldr x1, [x27, #254]!
3410 # CHECK-NEXT: 7. 1 2.0 0.0 2.0 add x0, x27, #1
3411 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldrb w1, [x27], #254
3412 # CHECK-NEXT: 9. 1 2.0 0.0 2.0 add x0, x27, #1
3413 # CHECK-NEXT: 1 1.5 0.1 1.0 <total>
3415 # CHECK: [49] Code Region - G50
3417 # CHECK: Iterations: 100
3418 # CHECK-NEXT: Instructions: 1000
3419 # CHECK-NEXT: Total Cycles: 506
3420 # CHECK-NEXT: Total uOps: 1500
3422 # CHECK: Dispatch Width: 3
3423 # CHECK-NEXT: uOps Per Cycle: 2.96
3424 # CHECK-NEXT: IPC: 1.98
3425 # CHECK-NEXT: Block RThroughput: 5.0
3427 # CHECK: Timeline view:
3429 # CHECK-NEXT: Index 0123456789
3431 # CHECK: [0,0] DeeeeER . ldrb w1, [x27, #254]!
3432 # CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1
3433 # CHECK-NEXT: [0,2] .DeeeeER . ldrh w1, [x27], #254
3434 # CHECK-NEXT: [0,3] .D=eE--R . add x0, x27, #1
3435 # CHECK-NEXT: [0,4] . DeeeeER . ldrh w1, [x27, #254]!
3436 # CHECK-NEXT: [0,5] . D=eE--R . add x0, x27, #1
3437 # CHECK-NEXT: [0,6] . DeeeeER. ldrsb w1, [x27], #254
3438 # CHECK-NEXT: [0,7] . D=eE--R. add x0, x27, #1
3439 # CHECK-NEXT: [0,8] . DeeeeER ldrsb x1, [x27], #254
3440 # CHECK-NEXT: [0,9] . D=eE--R add x0, x27, #1
3442 # CHECK: Average Wait times (based on the timeline view):
3443 # CHECK-NEXT: [0]: Executions
3444 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3445 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3446 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3448 # CHECK: [0] [1] [2] [3]
3449 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrb w1, [x27, #254]!
3450 # CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1
3451 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldrh w1, [x27], #254
3452 # CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1
3453 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldrh w1, [x27, #254]!
3454 # CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1
3455 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldrsb w1, [x27], #254
3456 # CHECK-NEXT: 7. 1 2.0 0.0 2.0 add x0, x27, #1
3457 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldrsb x1, [x27], #254
3458 # CHECK-NEXT: 9. 1 2.0 0.0 2.0 add x0, x27, #1
3459 # CHECK-NEXT: 1 1.5 0.1 1.0 <total>
3461 # CHECK: [50] Code Region - G51
3463 # CHECK: Iterations: 100
3464 # CHECK-NEXT: Instructions: 1000
3465 # CHECK-NEXT: Total Cycles: 506
3466 # CHECK-NEXT: Total uOps: 1500
3468 # CHECK: Dispatch Width: 3
3469 # CHECK-NEXT: uOps Per Cycle: 2.96
3470 # CHECK-NEXT: IPC: 1.98
3471 # CHECK-NEXT: Block RThroughput: 5.0
3473 # CHECK: Timeline view:
3475 # CHECK-NEXT: Index 0123456789
3477 # CHECK: [0,0] DeeeeER . ldrsb w1, [x27, #254]!
3478 # CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1
3479 # CHECK-NEXT: [0,2] .DeeeeER . ldrsb x1, [x27, #254]!
3480 # CHECK-NEXT: [0,3] .D=eE--R . add x0, x27, #1
3481 # CHECK-NEXT: [0,4] . DeeeeER . ldrsh w1, [x27], #254
3482 # CHECK-NEXT: [0,5] . D=eE--R . add x0, x27, #1
3483 # CHECK-NEXT: [0,6] . DeeeeER. ldrsh x1, [x27], #254
3484 # CHECK-NEXT: [0,7] . D=eE--R. add x0, x27, #1
3485 # CHECK-NEXT: [0,8] . DeeeeER ldrsh w1, [x27, #254]!
3486 # CHECK-NEXT: [0,9] . D=eE--R add x0, x27, #1
3488 # CHECK: Average Wait times (based on the timeline view):
3489 # CHECK-NEXT: [0]: Executions
3490 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3491 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3492 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3494 # CHECK: [0] [1] [2] [3]
3495 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrsb w1, [x27, #254]!
3496 # CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1
3497 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldrsb x1, [x27, #254]!
3498 # CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1
3499 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldrsh w1, [x27], #254
3500 # CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1
3501 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldrsh x1, [x27], #254
3502 # CHECK-NEXT: 7. 1 2.0 0.0 2.0 add x0, x27, #1
3503 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldrsh w1, [x27, #254]!
3504 # CHECK-NEXT: 9. 1 2.0 0.0 2.0 add x0, x27, #1
3505 # CHECK-NEXT: 1 1.5 0.1 1.0 <total>
3507 # CHECK: [51] Code Region - G52
3509 # CHECK: Iterations: 100
3510 # CHECK-NEXT: Instructions: 1000
3511 # CHECK-NEXT: Total Cycles: 603
3512 # CHECK-NEXT: Total uOps: 1600
3514 # CHECK: Dispatch Width: 3
3515 # CHECK-NEXT: uOps Per Cycle: 2.65
3516 # CHECK-NEXT: IPC: 1.66
3517 # CHECK-NEXT: Block RThroughput: 5.3
3519 # CHECK: Timeline view:
3520 # CHECK-NEXT: Index 012345678
3522 # CHECK: [0,0] DeeeeER . ldrsh x1, [x27, #254]!
3523 # CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1
3524 # CHECK-NEXT: [0,2] .DeeeeER. ldrsw x1, [x27], #254
3525 # CHECK-NEXT: [0,3] .D=eE--R. add x0, x27, #1
3526 # CHECK-NEXT: [0,4] . DeeeeER ldrsw x1, [x27, #254]!
3527 # CHECK-NEXT: [0,5] . D=eE--R add x0, x27, #1
3528 # CHECK-NEXT: [0,6] . DeE--R st1 { v1.1d }, [x27], #8
3529 # CHECK-NEXT: [0,7] . D=eE-R add x0, x27, #1
3530 # CHECK-NEXT: [0,8] . DeeER st1 { v1.2d }, [x27], #16
3531 # CHECK-NEXT: [0,9] . DeER add x0, x27, #1
3533 # CHECK: Average Wait times (based on the timeline view):
3534 # CHECK-NEXT: [0]: Executions
3535 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3536 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3537 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3539 # CHECK: [0] [1] [2] [3]
3540 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrsh x1, [x27, #254]!
3541 # CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1
3542 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldrsw x1, [x27], #254
3543 # CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1
3544 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldrsw x1, [x27, #254]!
3545 # CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1
3546 # CHECK-NEXT: 6. 1 1.0 0.0 2.0 st1 { v1.1d }, [x27], #8
3547 # CHECK-NEXT: 7. 1 2.0 0.0 1.0 add x0, x27, #1
3548 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 st1 { v1.2d }, [x27], #16
3549 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
3550 # CHECK-NEXT: 1 1.4 0.1 0.9 <total>
3552 # CHECK: [52] Code Region - G53
3554 # CHECK: Iterations: 100
3555 # CHECK-NEXT: Instructions: 1000
3556 # CHECK-NEXT: Total Cycles: 703
3557 # CHECK-NEXT: Total uOps: 1700
3559 # CHECK: Dispatch Width: 3
3560 # CHECK-NEXT: uOps Per Cycle: 2.42
3561 # CHECK-NEXT: IPC: 1.42
3562 # CHECK-NEXT: Block RThroughput: 7.0
3564 # CHECK: Timeline view:
3565 # CHECK-NEXT: Index 0123456789
3567 # CHECK: [0,0] DeER . . st1 { v1.2s }, [x27], #8
3568 # CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1
3569 # CHECK-NEXT: [0,2] .DeER. . st1 { v1.4h }, [x27], #8
3570 # CHECK-NEXT: [0,3] .D=eER . add x0, x27, #1
3571 # CHECK-NEXT: [0,4] . DeeER . st1 { v1.4s }, [x27], #16
3572 # CHECK-NEXT: [0,5] . DeER . add x0, x27, #1
3573 # CHECK-NEXT: [0,6] . D=eER . st1 { v1.8b }, [x27], #8
3574 # CHECK-NEXT: [0,7] . D=eER. add x0, x27, #1
3575 # CHECK-NEXT: [0,8] . DeeER st1 { v1.8h }, [x27], #16
3576 # CHECK-NEXT: [0,9] . .DeER add x0, x27, #1
3578 # CHECK: Average Wait times (based on the timeline view):
3579 # CHECK-NEXT: [0]: Executions
3580 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3581 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3582 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3584 # CHECK: [0] [1] [2] [3]
3585 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2s }, [x27], #8
3586 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1
3587 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.4h }, [x27], #8
3588 # CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1
3589 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.4s }, [x27], #16
3590 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
3591 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 st1 { v1.8b }, [x27], #8
3592 # CHECK-NEXT: 7. 1 2.0 0.0 0.0 add x0, x27, #1
3593 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 st1 { v1.8h }, [x27], #16
3594 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
3595 # CHECK-NEXT: 1 1.4 0.2 0.0 <total>
3597 # CHECK: [53] Code Region - G54
3599 # CHECK: Iterations: 100
3600 # CHECK-NEXT: Instructions: 1000
3601 # CHECK-NEXT: Total Cycles: 704
3602 # CHECK-NEXT: Total uOps: 1700
3604 # CHECK: Dispatch Width: 3
3605 # CHECK-NEXT: uOps Per Cycle: 2.41
3606 # CHECK-NEXT: IPC: 1.42
3607 # CHECK-NEXT: Block RThroughput: 7.0
3609 # CHECK: Timeline view:
3611 # CHECK-NEXT: Index 0123456789
3613 # CHECK: [0,0] DeeER. . st1 { v1.16b }, [x27], #16
3614 # CHECK-NEXT: [0,1] .DeER. . add x0, x27, #1
3615 # CHECK-NEXT: [0,2] .D=eER . st1 { v1.1d }, [x27], x28
3616 # CHECK-NEXT: [0,3] . D=eER . add x0, x27, #1
3617 # CHECK-NEXT: [0,4] . DeeER . st1 { v1.2d }, [x27], x28
3618 # CHECK-NEXT: [0,5] . DeER . add x0, x27, #1
3619 # CHECK-NEXT: [0,6] . D=eER . st1 { v1.2s }, [x27], x28
3620 # CHECK-NEXT: [0,7] . D=eER. add x0, x27, #1
3621 # CHECK-NEXT: [0,8] . D=eER. st1 { v1.4h }, [x27], x28
3622 # CHECK-NEXT: [0,9] . .D=eER add x0, x27, #1
3624 # CHECK: Average Wait times (based on the timeline view):
3625 # CHECK-NEXT: [0]: Executions
3626 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3627 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3628 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3630 # CHECK: [0] [1] [2] [3]
3631 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.16b }, [x27], #16
3632 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
3633 # CHECK-NEXT: 2. 1 2.0 1.0 0.0 st1 { v1.1d }, [x27], x28
3634 # CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1
3635 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.2d }, [x27], x28
3636 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
3637 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 st1 { v1.2s }, [x27], x28
3638 # CHECK-NEXT: 7. 1 2.0 0.0 0.0 add x0, x27, #1
3639 # CHECK-NEXT: 8. 1 2.0 0.0 0.0 st1 { v1.4h }, [x27], x28
3640 # CHECK-NEXT: 9. 1 2.0 0.0 0.0 add x0, x27, #1
3641 # CHECK-NEXT: 1 1.6 0.3 0.0 <total>
3643 # CHECK: [54] Code Region - G55
3645 # CHECK: Iterations: 100
3646 # CHECK-NEXT: Instructions: 1000
3647 # CHECK-NEXT: Total Cycles: 903
3648 # CHECK-NEXT: Total uOps: 1900
3650 # CHECK: Dispatch Width: 3
3651 # CHECK-NEXT: uOps Per Cycle: 2.10
3652 # CHECK-NEXT: IPC: 1.11
3653 # CHECK-NEXT: Block RThroughput: 9.0
3655 # CHECK: Timeline view:
3657 # CHECK-NEXT: Index 0123456789
3659 # CHECK: [0,0] DeeER. .. st1 { v1.4s }, [x27], x28
3660 # CHECK-NEXT: [0,1] .DeER. .. add x0, x27, #1
3661 # CHECK-NEXT: [0,2] .D=eER .. st1 { v1.8b }, [x27], x28
3662 # CHECK-NEXT: [0,3] . D=eER .. add x0, x27, #1
3663 # CHECK-NEXT: [0,4] . DeeER .. st1 { v1.8h }, [x27], x28
3664 # CHECK-NEXT: [0,5] . DeER .. add x0, x27, #1
3665 # CHECK-NEXT: [0,6] . DeeER.. st1 { v1.16b }, [x27], x28
3666 # CHECK-NEXT: [0,7] . .DeER.. add x0, x27, #1
3667 # CHECK-NEXT: [0,8] . . DeeER st1 { v1.1d, v2.1d }, [x27], #16
3668 # CHECK-NEXT: [0,9] . . DeER add x0, x27, #1
3670 # CHECK: Average Wait times (based on the timeline view):
3671 # CHECK-NEXT: [0]: Executions
3672 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3673 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3674 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3676 # CHECK: [0] [1] [2] [3]
3677 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4s }, [x27], x28
3678 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
3679 # CHECK-NEXT: 2. 1 2.0 1.0 0.0 st1 { v1.8b }, [x27], x28
3680 # CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1
3681 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.8h }, [x27], x28
3682 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
3683 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 st1 { v1.16b }, [x27], x28
3684 # CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1
3685 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st1 { v1.1d, v2.1d }, [x27], #16
3686 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
3687 # CHECK-NEXT: 1 1.2 0.4 0.0 <total>
3689 # CHECK: [55] Code Region - G56
3691 # CHECK: Iterations: 100
3692 # CHECK-NEXT: Instructions: 1000
3693 # CHECK-NEXT: Total Cycles: 1403
3694 # CHECK-NEXT: Total uOps: 2400
3696 # CHECK: Dispatch Width: 3
3697 # CHECK-NEXT: uOps Per Cycle: 1.71
3698 # CHECK-NEXT: IPC: 0.71
3699 # CHECK-NEXT: Block RThroughput: 14.0
3701 # CHECK: Timeline view:
3702 # CHECK-NEXT: 0123456
3703 # CHECK-NEXT: Index 0123456789
3705 # CHECK: [0,0] DeeeeER . .. st1 { v1.2d, v2.2d }, [x27], #32
3706 # CHECK-NEXT: [0,1] .DeE--R . .. add x0, x27, #1
3707 # CHECK-NEXT: [0,2] . D==eeER . .. st1 { v1.2s, v2.2s }, [x27], #16
3708 # CHECK-NEXT: [0,3] . D==eER . .. add x0, x27, #1
3709 # CHECK-NEXT: [0,4] . D==eeER .. st1 { v1.4h, v2.4h }, [x27], #16
3710 # CHECK-NEXT: [0,5] . D==eER .. add x0, x27, #1
3711 # CHECK-NEXT: [0,6] . .D==eeeeER.. st1 { v1.4s, v2.4s }, [x27], #32
3712 # CHECK-NEXT: [0,7] . . D==eE--R.. add x0, x27, #1
3713 # CHECK-NEXT: [0,8] . . D====eeER st1 { v1.8b, v2.8b }, [x27], #16
3714 # CHECK-NEXT: [0,9] . . D====eER add x0, x27, #1
3716 # CHECK: Average Wait times (based on the timeline view):
3717 # CHECK-NEXT: [0]: Executions
3718 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3719 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3720 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3722 # CHECK: [0] [1] [2] [3]
3723 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2d, v2.2d }, [x27], #32
3724 # CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1
3725 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 st1 { v1.2s, v2.2s }, [x27], #16
3726 # CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1
3727 # CHECK-NEXT: 4. 1 3.0 1.0 0.0 st1 { v1.4h, v2.4h }, [x27], #16
3728 # CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1
3729 # CHECK-NEXT: 6. 1 3.0 1.0 0.0 st1 { v1.4s, v2.4s }, [x27], #32
3730 # CHECK-NEXT: 7. 1 3.0 0.0 2.0 add x0, x27, #1
3731 # CHECK-NEXT: 8. 1 5.0 3.0 0.0 st1 { v1.8b, v2.8b }, [x27], #16
3732 # CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1
3733 # CHECK-NEXT: 1 3.0 0.9 0.4 <total>
3735 # CHECK: [56] Code Region - G57
3737 # CHECK: Iterations: 100
3738 # CHECK-NEXT: Instructions: 1000
3739 # CHECK-NEXT: Total Cycles: 1603
3740 # CHECK-NEXT: Total uOps: 2600
3742 # CHECK: Dispatch Width: 3
3743 # CHECK-NEXT: uOps Per Cycle: 1.62
3744 # CHECK-NEXT: IPC: 0.62
3745 # CHECK-NEXT: Block RThroughput: 16.0
3747 # CHECK: Timeline view:
3748 # CHECK-NEXT: 012345678
3749 # CHECK-NEXT: Index 0123456789
3751 # CHECK: [0,0] DeeeeER . . . st1 { v1.8h, v2.8h }, [x27], #32
3752 # CHECK-NEXT: [0,1] .DeE--R . . . add x0, x27, #1
3753 # CHECK-NEXT: [0,2] . D==eeeeER . . st1 { v1.16b, v2.16b }, [x27], #32
3754 # CHECK-NEXT: [0,3] . D==eE--R . . add x0, x27, #1
3755 # CHECK-NEXT: [0,4] . D====eeER . . st1 { v1.1d, v2.1d }, [x27], x28
3756 # CHECK-NEXT: [0,5] . D====eER . . add x0, x27, #1
3757 # CHECK-NEXT: [0,6] . .D====eeeeER . st1 { v1.2d, v2.2d }, [x27], x28
3758 # CHECK-NEXT: [0,7] . . D====eE--R . add x0, x27, #1
3759 # CHECK-NEXT: [0,8] . . D======eeER st1 { v1.2s, v2.2s }, [x27], x28
3760 # CHECK-NEXT: [0,9] . . D======eER add x0, x27, #1
3762 # CHECK: Average Wait times (based on the timeline view):
3763 # CHECK-NEXT: [0]: Executions
3764 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3765 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3766 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3768 # CHECK: [0] [1] [2] [3]
3769 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8h, v2.8h }, [x27], #32
3770 # CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1
3771 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 st1 { v1.16b, v2.16b }, [x27], #32
3772 # CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1
3773 # CHECK-NEXT: 4. 1 5.0 3.0 0.0 st1 { v1.1d, v2.1d }, [x27], x28
3774 # CHECK-NEXT: 5. 1 5.0 0.0 0.0 add x0, x27, #1
3775 # CHECK-NEXT: 6. 1 5.0 1.0 0.0 st1 { v1.2d, v2.2d }, [x27], x28
3776 # CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1
3777 # CHECK-NEXT: 8. 1 7.0 3.0 0.0 st1 { v1.2s, v2.2s }, [x27], x28
3778 # CHECK-NEXT: 9. 1 7.0 0.0 0.0 add x0, x27, #1
3779 # CHECK-NEXT: 1 4.2 1.1 0.6 <total>
3781 # CHECK: [57] Code Region - G58
3783 # CHECK: Iterations: 100
3784 # CHECK-NEXT: Instructions: 1000
3785 # CHECK-NEXT: Total Cycles: 1603
3786 # CHECK-NEXT: Total uOps: 2600
3788 # CHECK: Dispatch Width: 3
3789 # CHECK-NEXT: uOps Per Cycle: 1.62
3790 # CHECK-NEXT: IPC: 0.62
3791 # CHECK-NEXT: Block RThroughput: 16.0
3793 # CHECK: Timeline view:
3794 # CHECK-NEXT: 012345678
3795 # CHECK-NEXT: Index 0123456789
3797 # CHECK: [0,0] DeeER. . . . st1 { v1.4h, v2.4h }, [x27], x28
3798 # CHECK-NEXT: [0,1] .DeER. . . . add x0, x27, #1
3799 # CHECK-NEXT: [0,2] . DeeeeER . . . st1 { v1.4s, v2.4s }, [x27], x28
3800 # CHECK-NEXT: [0,3] . DeE--R . . . add x0, x27, #1
3801 # CHECK-NEXT: [0,4] . D==eeER . . st1 { v1.8b, v2.8b }, [x27], x28
3802 # CHECK-NEXT: [0,5] . D==eER . . add x0, x27, #1
3803 # CHECK-NEXT: [0,6] . .D==eeeeER. . st1 { v1.8h, v2.8h }, [x27], x28
3804 # CHECK-NEXT: [0,7] . . D==eE--R. . add x0, x27, #1
3805 # CHECK-NEXT: [0,8] . . D====eeeeER st1 { v1.16b, v2.16b }, [x27], x28
3806 # CHECK-NEXT: [0,9] . . D====eE--R add x0, x27, #1
3808 # CHECK: Average Wait times (based on the timeline view):
3809 # CHECK-NEXT: [0]: Executions
3810 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3811 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3812 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3814 # CHECK: [0] [1] [2] [3]
3815 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4h, v2.4h }, [x27], x28
3816 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
3817 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st1 { v1.4s, v2.4s }, [x27], x28
3818 # CHECK-NEXT: 3. 1 1.0 0.0 2.0 add x0, x27, #1
3819 # CHECK-NEXT: 4. 1 3.0 3.0 0.0 st1 { v1.8b, v2.8b }, [x27], x28
3820 # CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1
3821 # CHECK-NEXT: 6. 1 3.0 1.0 0.0 st1 { v1.8h, v2.8h }, [x27], x28
3822 # CHECK-NEXT: 7. 1 3.0 0.0 2.0 add x0, x27, #1
3823 # CHECK-NEXT: 8. 1 5.0 3.0 0.0 st1 { v1.16b, v2.16b }, [x27], x28
3824 # CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1
3825 # CHECK-NEXT: 1 2.6 0.9 0.6 <total>
3827 # CHECK: [58] Code Region - G59
3829 # CHECK: Iterations: 100
3830 # CHECK-NEXT: Instructions: 1000
3831 # CHECK-NEXT: Total Cycles: 2103
3832 # CHECK-NEXT: Total uOps: 3100
3834 # CHECK: Dispatch Width: 3
3835 # CHECK-NEXT: uOps Per Cycle: 1.47
3836 # CHECK-NEXT: IPC: 0.48
3837 # CHECK-NEXT: Block RThroughput: 21.0
3839 # CHECK: Timeline view:
3840 # CHECK-NEXT: 0123456789
3841 # CHECK-NEXT: Index 0123456789 0123
3843 # CHECK: [0,0] DeeeER . . . . st1 { v1.1d, v2.1d, v3.1d }, [x27], #24
3844 # CHECK-NEXT: [0,1] .DeE-R . . . . add x0, x27, #1
3845 # CHECK-NEXT: [0,2] . D=eeeeeeER . . . st1 { v1.2d, v2.2d, v3.2d }, [x27], #48
3846 # CHECK-NEXT: [0,3] . DeE----R . . . add x0, x27, #1
3847 # CHECK-NEXT: [0,4] . D====eeeER. . . st1 { v1.2s, v2.2s, v3.2s }, [x27], #24
3848 # CHECK-NEXT: [0,5] . .D====eE-R. . . add x0, x27, #1
3849 # CHECK-NEXT: [0,6] . . D=====eeeER . . st1 { v1.4h, v2.4h, v3.4h }, [x27], #24
3850 # CHECK-NEXT: [0,7] . . D=====eE-R . . add x0, x27, #1
3851 # CHECK-NEXT: [0,8] . . D======eeeeeeER st1 { v1.4s, v2.4s, v3.4s }, [x27], #48
3852 # CHECK-NEXT: [0,9] . . .D=====eE----R add x0, x27, #1
3854 # CHECK: Average Wait times (based on the timeline view):
3855 # CHECK-NEXT: [0]: Executions
3856 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3857 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3858 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3860 # CHECK: [0] [1] [2] [3]
3861 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.1d, v2.1d, v3.1d }, [x27], #24
3862 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
3863 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 st1 { v1.2d, v2.2d, v3.2d }, [x27], #48
3864 # CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1
3865 # CHECK-NEXT: 4. 1 5.0 5.0 0.0 st1 { v1.2s, v2.2s, v3.2s }, [x27], #24
3866 # CHECK-NEXT: 5. 1 5.0 0.0 1.0 add x0, x27, #1
3867 # CHECK-NEXT: 6. 1 6.0 2.0 0.0 st1 { v1.4h, v2.4h, v3.4h }, [x27], #24
3868 # CHECK-NEXT: 7. 1 6.0 0.0 1.0 add x0, x27, #1
3869 # CHECK-NEXT: 8. 1 7.0 2.0 0.0 st1 { v1.4s, v2.4s, v3.4s }, [x27], #48
3870 # CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1
3871 # CHECK-NEXT: 1 4.0 1.2 1.1 <total>
3873 # CHECK: [59] Code Region - G60
3875 # CHECK: Iterations: 100
3876 # CHECK-NEXT: Instructions: 1000
3877 # CHECK-NEXT: Total Cycles: 2403
3878 # CHECK-NEXT: Total uOps: 3400
3880 # CHECK: Dispatch Width: 3
3881 # CHECK-NEXT: uOps Per Cycle: 1.41
3882 # CHECK-NEXT: IPC: 0.42
3883 # CHECK-NEXT: Block RThroughput: 24.0
3885 # CHECK: Timeline view:
3886 # CHECK-NEXT: 0123456789
3887 # CHECK-NEXT: Index 0123456789 0123456
3889 # CHECK: [0,0] DeeeER . . . .. st1 { v1.8b, v2.8b, v3.8b }, [x27], #24
3890 # CHECK-NEXT: [0,1] .DeE-R . . . .. add x0, x27, #1
3891 # CHECK-NEXT: [0,2] . D=eeeeeeER . . .. st1 { v1.8h, v2.8h, v3.8h }, [x27], #48
3892 # CHECK-NEXT: [0,3] . DeE----R . . .. add x0, x27, #1
3893 # CHECK-NEXT: [0,4] . D====eeeeeeER . .. st1 { v1.16b, v2.16b, v3.16b }, [x27], #48
3894 # CHECK-NEXT: [0,5] . . D===eE----R . .. add x0, x27, #1
3895 # CHECK-NEXT: [0,6] . . D=======eeeER .. st1 { v1.1d, v2.1d, v3.1d }, [x27], x28
3896 # CHECK-NEXT: [0,7] . . D=======eE-R .. add x0, x27, #1
3897 # CHECK-NEXT: [0,8] . . D========eeeeeeER st1 { v1.2d, v2.2d, v3.2d }, [x27], x28
3898 # CHECK-NEXT: [0,9] . . . D=======eE----R add x0, x27, #1
3900 # CHECK: Average Wait times (based on the timeline view):
3901 # CHECK-NEXT: [0]: Executions
3902 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3903 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3904 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3906 # CHECK: [0] [1] [2] [3]
3907 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8b, v2.8b, v3.8b }, [x27], #24
3908 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
3909 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 st1 { v1.8h, v2.8h, v3.8h }, [x27], #48
3910 # CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1
3911 # CHECK-NEXT: 4. 1 5.0 5.0 0.0 st1 { v1.16b, v2.16b, v3.16b }, [x27], #48
3912 # CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1
3913 # CHECK-NEXT: 6. 1 8.0 5.0 0.0 st1 { v1.1d, v2.1d, v3.1d }, [x27], x28
3914 # CHECK-NEXT: 7. 1 8.0 0.0 1.0 add x0, x27, #1
3915 # CHECK-NEXT: 8. 1 9.0 2.0 0.0 st1 { v1.2d, v2.2d, v3.2d }, [x27], x28
3916 # CHECK-NEXT: 9. 1 8.0 0.0 4.0 add x0, x27, #1
3917 # CHECK-NEXT: 1 4.7 1.5 1.4 <total>
3919 # CHECK: [60] Code Region - G61
3921 # CHECK: Iterations: 100
3922 # CHECK-NEXT: Instructions: 1000
3923 # CHECK-NEXT: Total Cycles: 2103
3924 # CHECK-NEXT: Total uOps: 3100
3926 # CHECK: Dispatch Width: 3
3927 # CHECK-NEXT: uOps Per Cycle: 1.47
3928 # CHECK-NEXT: IPC: 0.48
3929 # CHECK-NEXT: Block RThroughput: 21.0
3931 # CHECK: Timeline view:
3932 # CHECK-NEXT: 0123456789
3933 # CHECK-NEXT: Index 0123456789 0123
3935 # CHECK: [0,0] DeeeER . . . . st1 { v1.2s, v2.2s, v3.2s }, [x27], x28
3936 # CHECK-NEXT: [0,1] .DeE-R . . . . add x0, x27, #1
3937 # CHECK-NEXT: [0,2] . D=eeeER . . . . st1 { v1.4h, v2.4h, v3.4h }, [x27], x28
3938 # CHECK-NEXT: [0,3] . D=eE-R . . . . add x0, x27, #1
3939 # CHECK-NEXT: [0,4] . D==eeeeeeER. . . st1 { v1.4s, v2.4s, v3.4s }, [x27], x28
3940 # CHECK-NEXT: [0,5] . .D=eE----R. . . add x0, x27, #1
3941 # CHECK-NEXT: [0,6] . . D=====eeeER . . st1 { v1.8b, v2.8b, v3.8b }, [x27], x28
3942 # CHECK-NEXT: [0,7] . . D=====eE-R . . add x0, x27, #1
3943 # CHECK-NEXT: [0,8] . . D======eeeeeeER st1 { v1.8h, v2.8h, v3.8h }, [x27], x28
3944 # CHECK-NEXT: [0,9] . . .D=====eE----R add x0, x27, #1
3946 # CHECK: Average Wait times (based on the timeline view):
3947 # CHECK-NEXT: [0]: Executions
3948 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3949 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3950 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3952 # CHECK: [0] [1] [2] [3]
3953 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2s, v2.2s, v3.2s }, [x27], x28
3954 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
3955 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 st1 { v1.4h, v2.4h, v3.4h }, [x27], x28
3956 # CHECK-NEXT: 3. 1 2.0 0.0 1.0 add x0, x27, #1
3957 # CHECK-NEXT: 4. 1 3.0 2.0 0.0 st1 { v1.4s, v2.4s, v3.4s }, [x27], x28
3958 # CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1
3959 # CHECK-NEXT: 6. 1 6.0 5.0 0.0 st1 { v1.8b, v2.8b, v3.8b }, [x27], x28
3960 # CHECK-NEXT: 7. 1 6.0 0.0 1.0 add x0, x27, #1
3961 # CHECK-NEXT: 8. 1 7.0 2.0 0.0 st1 { v1.8h, v2.8h, v3.8h }, [x27], x28
3962 # CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1
3963 # CHECK-NEXT: 1 3.6 1.2 1.1 <total>
3965 # CHECK: [61] Code Region - G62
3967 # CHECK: Iterations: 100
3968 # CHECK-NEXT: Instructions: 1000
3969 # CHECK-NEXT: Total Cycles: 2603
3970 # CHECK-NEXT: Total uOps: 3600
3972 # CHECK: Dispatch Width: 3
3973 # CHECK-NEXT: uOps Per Cycle: 1.38
3974 # CHECK-NEXT: IPC: 0.38
3975 # CHECK-NEXT: Block RThroughput: 26.0
3977 # CHECK: Timeline view:
3978 # CHECK-NEXT: 0123456789
3979 # CHECK-NEXT: Index 0123456789 012345678
3981 # CHECK: [0,0] DeeeeeeER . . . . . st1 { v1.16b, v2.16b, v3.16b }, [x27], x28
3982 # CHECK-NEXT: [0,1] . DeE---R . . . . . add x0, x27, #1
3983 # CHECK-NEXT: [0,2] . D===eeeeER . . . . st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
3984 # CHECK-NEXT: [0,3] . D===eE--R . . . . add x0, x27, #1
3985 # CHECK-NEXT: [0,4] . D=====eeeeeeeeER . . st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
3986 # CHECK-NEXT: [0,5] . . D===eE------R . . add x0, x27, #1
3987 # CHECK-NEXT: [0,6] . . D=========eeeeER. . st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
3988 # CHECK-NEXT: [0,7] . . D=========eE--R. . add x0, x27, #1
3989 # CHECK-NEXT: [0,8] . . .D===========eeeeER st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
3990 # CHECK-NEXT: [0,9] . . . D===========eE--R add x0, x27, #1
3992 # CHECK: Average Wait times (based on the timeline view):
3993 # CHECK-NEXT: [0]: Executions
3994 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3995 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3996 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3998 # CHECK: [0] [1] [2] [3]
3999 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.16b, v2.16b, v3.16b }, [x27], x28
4000 # CHECK-NEXT: 1. 1 1.0 1.0 3.0 add x0, x27, #1
4001 # CHECK-NEXT: 2. 1 4.0 4.0 0.0 st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
4002 # CHECK-NEXT: 3. 1 4.0 0.0 2.0 add x0, x27, #1
4003 # CHECK-NEXT: 4. 1 6.0 3.0 0.0 st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
4004 # CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1
4005 # CHECK-NEXT: 6. 1 10.0 7.0 0.0 st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
4006 # CHECK-NEXT: 7. 1 10.0 0.0 2.0 add x0, x27, #1
4007 # CHECK-NEXT: 8. 1 12.0 3.0 0.0 st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
4008 # CHECK-NEXT: 9. 1 12.0 0.0 2.0 add x0, x27, #1
4009 # CHECK-NEXT: 1 6.4 1.9 1.5 <total>
4011 # CHECK: [62] Code Region - G63
4013 # CHECK: Iterations: 100
4014 # CHECK-NEXT: Instructions: 1000
4015 # CHECK-NEXT: Total Cycles: 3203
4016 # CHECK-NEXT: Total uOps: 4200
4018 # CHECK: Dispatch Width: 3
4019 # CHECK-NEXT: uOps Per Cycle: 1.31
4020 # CHECK-NEXT: IPC: 0.31
4021 # CHECK-NEXT: Block RThroughput: 32.0
4023 # CHECK: Timeline view:
4024 # CHECK-NEXT: 0123456789 01234
4025 # CHECK-NEXT: Index 0123456789 0123456789
4027 # CHECK: [0,0] DeeeeeeeeER . . . . . st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4028 # CHECK-NEXT: [0,1] . DeE----R . . . . . add x0, x27, #1
4029 # CHECK-NEXT: [0,2] . D====eeeeER. . . . . st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4030 # CHECK-NEXT: [0,3] . D====eE--R. . . . . add x0, x27, #1
4031 # CHECK-NEXT: [0,4] . .D======eeeeeeeeER . . . st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4032 # CHECK-NEXT: [0,5] . . D====eE------R . . . add x0, x27, #1
4033 # CHECK-NEXT: [0,6] . . D==========eeeeeeeeER . st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4034 # CHECK-NEXT: [0,7] . . . D========eE------R . add x0, x27, #1
4035 # CHECK-NEXT: [0,8] . . . D==============eeeeER st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
4036 # CHECK-NEXT: [0,9] . . . D==============eE--R add x0, x27, #1
4038 # CHECK: Average Wait times (based on the timeline view):
4039 # CHECK-NEXT: [0]: Executions
4040 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4041 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4042 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4044 # CHECK: [0] [1] [2] [3]
4045 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4046 # CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1
4047 # CHECK-NEXT: 2. 1 5.0 5.0 0.0 st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4048 # CHECK-NEXT: 3. 1 5.0 0.0 2.0 add x0, x27, #1
4049 # CHECK-NEXT: 4. 1 7.0 3.0 0.0 st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4050 # CHECK-NEXT: 5. 1 5.0 0.0 6.0 add x0, x27, #1
4051 # CHECK-NEXT: 6. 1 11.0 7.0 0.0 st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4052 # CHECK-NEXT: 7. 1 9.0 0.0 6.0 add x0, x27, #1
4053 # CHECK-NEXT: 8. 1 15.0 7.0 0.0 st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
4054 # CHECK-NEXT: 9. 1 15.0 0.0 2.0 add x0, x27, #1
4055 # CHECK-NEXT: 1 7.4 2.4 2.0 <total>
4057 # CHECK: [63] Code Region - G64
4059 # CHECK: Iterations: 100
4060 # CHECK-NEXT: Instructions: 1000
4061 # CHECK-NEXT: Total Cycles: 2803
4062 # CHECK-NEXT: Total uOps: 3800
4064 # CHECK: Dispatch Width: 3
4065 # CHECK-NEXT: uOps Per Cycle: 1.36
4066 # CHECK-NEXT: IPC: 0.36
4067 # CHECK-NEXT: Block RThroughput: 28.0
4069 # CHECK: Timeline view:
4070 # CHECK-NEXT: 0123456789 0
4071 # CHECK-NEXT: Index 0123456789 0123456789
4073 # CHECK: [0,0] DeeeeeeeeER . . . . st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4074 # CHECK-NEXT: [0,1] . DeE----R . . . . add x0, x27, #1
4075 # CHECK-NEXT: [0,2] . D====eeeeER. . . . st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4076 # CHECK-NEXT: [0,3] . D====eE--R. . . . add x0, x27, #1
4077 # CHECK-NEXT: [0,4] . .D======eeeeER . . . st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4078 # CHECK-NEXT: [0,5] . . D======eE--R . . . add x0, x27, #1
4079 # CHECK-NEXT: [0,6] . . D========eeeeeeeeER . st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4080 # CHECK-NEXT: [0,7] . . .D======eE------R . add x0, x27, #1
4081 # CHECK-NEXT: [0,8] . . . D============eeeeER st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4082 # CHECK-NEXT: [0,9] . . . D============eE--R add x0, x27, #1
4084 # CHECK: Average Wait times (based on the timeline view):
4085 # CHECK-NEXT: [0]: Executions
4086 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4087 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4088 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4090 # CHECK: [0] [1] [2] [3]
4091 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4092 # CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1
4093 # CHECK-NEXT: 2. 1 5.0 5.0 0.0 st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4094 # CHECK-NEXT: 3. 1 5.0 0.0 2.0 add x0, x27, #1
4095 # CHECK-NEXT: 4. 1 7.0 3.0 0.0 st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4096 # CHECK-NEXT: 5. 1 7.0 0.0 2.0 add x0, x27, #1
4097 # CHECK-NEXT: 6. 1 9.0 3.0 0.0 st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4098 # CHECK-NEXT: 7. 1 7.0 0.0 6.0 add x0, x27, #1
4099 # CHECK-NEXT: 8. 1 13.0 7.0 0.0 st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4100 # CHECK-NEXT: 9. 1 13.0 0.0 2.0 add x0, x27, #1
4101 # CHECK-NEXT: 1 6.8 2.0 1.6 <total>
4103 # CHECK: [64] Code Region - G65
4105 # CHECK: Iterations: 100
4106 # CHECK-NEXT: Instructions: 1000
4107 # CHECK-NEXT: Total Cycles: 1904
4108 # CHECK-NEXT: Total uOps: 2900
4110 # CHECK: Dispatch Width: 3
4111 # CHECK-NEXT: uOps Per Cycle: 1.52
4112 # CHECK-NEXT: IPC: 0.53
4113 # CHECK-NEXT: Block RThroughput: 19.0
4115 # CHECK: Timeline view:
4116 # CHECK-NEXT: 0123456789
4117 # CHECK-NEXT: Index 0123456789 012
4119 # CHECK: [0,0] DeeeeeeeeER . . . st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4120 # CHECK-NEXT: [0,1] . DeE----R . . . add x0, x27, #1
4121 # CHECK-NEXT: [0,2] . D====eeeeeeeeER . . st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4122 # CHECK-NEXT: [0,3] . . D==eE------R . . add x0, x27, #1
4123 # CHECK-NEXT: [0,4] . . D=========eER. . st1 { v1.b }[0], [x27], #1
4124 # CHECK-NEXT: [0,5] . . D=========eER . add x0, x27, #1
4125 # CHECK-NEXT: [0,6] . . D=========eER . st1 { v1.b }[8], [x27], #1
4126 # CHECK-NEXT: [0,7] . . D=========eER. add x0, x27, #1
4127 # CHECK-NEXT: [0,8] . . D=========eER. st1 { v1.b }[0], [x27], x28
4128 # CHECK-NEXT: [0,9] . . D=========eER add x0, x27, #1
4130 # CHECK: Average Wait times (based on the timeline view):
4131 # CHECK-NEXT: [0]: Executions
4132 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4133 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4134 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4136 # CHECK: [0] [1] [2] [3]
4137 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4138 # CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1
4139 # CHECK-NEXT: 2. 1 5.0 5.0 0.0 st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4140 # CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1
4141 # CHECK-NEXT: 4. 1 10.0 7.0 0.0 st1 { v1.b }[0], [x27], #1
4142 # CHECK-NEXT: 5. 1 10.0 0.0 0.0 add x0, x27, #1
4143 # CHECK-NEXT: 6. 1 10.0 0.0 0.0 st1 { v1.b }[8], [x27], #1
4144 # CHECK-NEXT: 7. 1 10.0 0.0 0.0 add x0, x27, #1
4145 # CHECK-NEXT: 8. 1 10.0 0.0 0.0 st1 { v1.b }[0], [x27], x28
4146 # CHECK-NEXT: 9. 1 10.0 0.0 0.0 add x0, x27, #1
4147 # CHECK-NEXT: 1 7.0 1.4 1.0 <total>
4149 # CHECK: [65] Code Region - G66
4151 # CHECK: Iterations: 100
4152 # CHECK-NEXT: Instructions: 1000
4153 # CHECK-NEXT: Total Cycles: 504
4154 # CHECK-NEXT: Total uOps: 1500
4156 # CHECK: Dispatch Width: 3
4157 # CHECK-NEXT: uOps Per Cycle: 2.98
4158 # CHECK-NEXT: IPC: 1.98
4159 # CHECK-NEXT: Block RThroughput: 5.0
4161 # CHECK: Timeline view:
4162 # CHECK-NEXT: Index 012345678
4164 # CHECK: [0,0] DeER . . st1 { v1.b }[8], [x27], x28
4165 # CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1
4166 # CHECK-NEXT: [0,2] .DeER. . st1 { v1.h }[0], [x27], #2
4167 # CHECK-NEXT: [0,3] .D=eER . add x0, x27, #1
4168 # CHECK-NEXT: [0,4] . DeER . st1 { v1.h }[4], [x27], #2
4169 # CHECK-NEXT: [0,5] . D=eER . add x0, x27, #1
4170 # CHECK-NEXT: [0,6] . DeER . st1 { v1.h }[0], [x27], x28
4171 # CHECK-NEXT: [0,7] . D=eER. add x0, x27, #1
4172 # CHECK-NEXT: [0,8] . DeER. st1 { v1.h }[4], [x27], x28
4173 # CHECK-NEXT: [0,9] . D=eER add x0, x27, #1
4175 # CHECK: Average Wait times (based on the timeline view):
4176 # CHECK-NEXT: [0]: Executions
4177 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4178 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4179 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4181 # CHECK: [0] [1] [2] [3]
4182 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.b }[8], [x27], x28
4183 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1
4184 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.h }[0], [x27], #2
4185 # CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1
4186 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.h }[4], [x27], #2
4187 # CHECK-NEXT: 5. 1 2.0 0.0 0.0 add x0, x27, #1
4188 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 st1 { v1.h }[0], [x27], x28
4189 # CHECK-NEXT: 7. 1 2.0 0.0 0.0 add x0, x27, #1
4190 # CHECK-NEXT: 8. 1 1.0 0.0 0.0 st1 { v1.h }[4], [x27], x28
4191 # CHECK-NEXT: 9. 1 2.0 0.0 0.0 add x0, x27, #1
4192 # CHECK-NEXT: 1 1.5 0.1 0.0 <total>
4194 # CHECK: [66] Code Region - G67
4196 # CHECK: Iterations: 100
4197 # CHECK-NEXT: Instructions: 1000
4198 # CHECK-NEXT: Total Cycles: 805
4199 # CHECK-NEXT: Total uOps: 2000
4201 # CHECK: Dispatch Width: 3
4202 # CHECK-NEXT: uOps Per Cycle: 2.48
4203 # CHECK-NEXT: IPC: 1.24
4204 # CHECK-NEXT: Block RThroughput: 8.0
4206 # CHECK: Timeline view:
4208 # CHECK-NEXT: Index 0123456789
4210 # CHECK: [0,0] DeER . . . st1 { v1.s }[0], [x27], #4
4211 # CHECK-NEXT: [0,1] D=eER. . . add x0, x27, #1
4212 # CHECK-NEXT: [0,2] .DeER. . . st1 { v1.s }[0], [x27], x28
4213 # CHECK-NEXT: [0,3] .D=eER . . add x0, x27, #1
4214 # CHECK-NEXT: [0,4] . DeeeER . . st1 { v1.d }[0], [x27], #8
4215 # CHECK-NEXT: [0,5] . DeE-R . . add x0, x27, #1
4216 # CHECK-NEXT: [0,6] . DeeeER. . st1 { v1.d }[0], [x27], x28
4217 # CHECK-NEXT: [0,7] . DeE-R. . add x0, x27, #1
4218 # CHECK-NEXT: [0,8] . .DeeeeER st2 { v1.2d, v2.2d }, [x27], #32
4219 # CHECK-NEXT: [0,9] . . DeE--R add x0, x27, #1
4221 # CHECK: Average Wait times (based on the timeline view):
4222 # CHECK-NEXT: [0]: Executions
4223 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4224 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4225 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4227 # CHECK: [0] [1] [2] [3]
4228 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.s }[0], [x27], #4
4229 # CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1
4230 # CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.s }[0], [x27], x28
4231 # CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1
4232 # CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.d }[0], [x27], #8
4233 # CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1
4234 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 st1 { v1.d }[0], [x27], x28
4235 # CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1
4236 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st2 { v1.2d, v2.2d }, [x27], #32
4237 # CHECK-NEXT: 9. 1 1.0 0.0 2.0 add x0, x27, #1
4238 # CHECK-NEXT: 1 1.2 0.3 0.4 <total>
4240 # CHECK: [67] Code Region - G68
4242 # CHECK: Iterations: 100
4243 # CHECK-NEXT: Instructions: 1000
4244 # CHECK-NEXT: Total Cycles: 1403
4245 # CHECK-NEXT: Total uOps: 3100
4247 # CHECK: Dispatch Width: 3
4248 # CHECK-NEXT: uOps Per Cycle: 2.21
4249 # CHECK-NEXT: IPC: 0.71
4250 # CHECK-NEXT: Block RThroughput: 14.0
4252 # CHECK: Timeline view:
4253 # CHECK-NEXT: 0123456
4254 # CHECK-NEXT: Index 0123456789
4256 # CHECK: [0,0] DeeeER . .. st2 { v1.2s, v2.2s }, [x27], #16
4257 # CHECK-NEXT: [0,1] .DeE-R . .. add x0, x27, #1
4258 # CHECK-NEXT: [0,2] . DeeeER . .. st2 { v1.4h, v2.4h }, [x27], #16
4259 # CHECK-NEXT: [0,3] . DeE-R . .. add x0, x27, #1
4260 # CHECK-NEXT: [0,4] . DeeeeER .. st2 { v1.4s, v2.4s }, [x27], #32
4261 # CHECK-NEXT: [0,5] . .DeE-R .. add x0, x27, #1
4262 # CHECK-NEXT: [0,6] . . D=eeeER .. st2 { v1.8b, v2.8b }, [x27], #16
4263 # CHECK-NEXT: [0,7] . . D=eE-R .. add x0, x27, #1
4264 # CHECK-NEXT: [0,8] . . D=eeeeER st2 { v1.8h, v2.8h }, [x27], #32
4265 # CHECK-NEXT: [0,9] . . .DeE--R add x0, x27, #1
4267 # CHECK: Average Wait times (based on the timeline view):
4268 # CHECK-NEXT: [0]: Executions
4269 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4270 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4271 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4273 # CHECK: [0] [1] [2] [3]
4274 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.2s, v2.2s }, [x27], #16
4275 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4276 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.4h, v2.4h }, [x27], #16
4277 # CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1
4278 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 st2 { v1.4s, v2.4s }, [x27], #32
4279 # CHECK-NEXT: 5. 1 1.0 1.0 1.0 add x0, x27, #1
4280 # CHECK-NEXT: 6. 1 2.0 2.0 0.0 st2 { v1.8b, v2.8b }, [x27], #16
4281 # CHECK-NEXT: 7. 1 2.0 0.0 1.0 add x0, x27, #1
4282 # CHECK-NEXT: 8. 1 2.0 1.0 0.0 st2 { v1.8h, v2.8h }, [x27], #32
4283 # CHECK-NEXT: 9. 1 1.0 0.0 2.0 add x0, x27, #1
4284 # CHECK-NEXT: 1 1.3 0.7 0.6 <total>
4286 # CHECK: [68] Code Region - G69
4288 # CHECK: Iterations: 100
4289 # CHECK-NEXT: Instructions: 1000
4290 # CHECK-NEXT: Total Cycles: 1603
4291 # CHECK-NEXT: Total uOps: 3200
4293 # CHECK: Dispatch Width: 3
4294 # CHECK-NEXT: uOps Per Cycle: 2.00
4295 # CHECK-NEXT: IPC: 0.62
4296 # CHECK-NEXT: Block RThroughput: 16.0
4298 # CHECK: Timeline view:
4299 # CHECK-NEXT: 012345678
4300 # CHECK-NEXT: Index 0123456789
4302 # CHECK: [0,0] DeeeeER . . . st2 { v1.16b, v2.16b }, [x27], #32
4303 # CHECK-NEXT: [0,1] . DeE-R . . . add x0, x27, #1
4304 # CHECK-NEXT: [0,2] . D=eeeeER . . st2 { v1.2d, v2.2d }, [x27], x28
4305 # CHECK-NEXT: [0,3] . D=eE--R . . add x0, x27, #1
4306 # CHECK-NEXT: [0,4] . D===eeeER . . st2 { v1.2s, v2.2s }, [x27], x28
4307 # CHECK-NEXT: [0,5] . .D===eE-R . . add x0, x27, #1
4308 # CHECK-NEXT: [0,6] . . D===eeeER . st2 { v1.4h, v2.4h }, [x27], x28
4309 # CHECK-NEXT: [0,7] . . D===eE-R . add x0, x27, #1
4310 # CHECK-NEXT: [0,8] . . D===eeeeER st2 { v1.4s, v2.4s }, [x27], x28
4311 # CHECK-NEXT: [0,9] . . .D==eE--R add x0, x27, #1
4313 # CHECK: Average Wait times (based on the timeline view):
4314 # CHECK-NEXT: [0]: Executions
4315 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4316 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4317 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4319 # CHECK: [0] [1] [2] [3]
4320 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.16b, v2.16b }, [x27], #32
4321 # CHECK-NEXT: 1. 1 1.0 1.0 1.0 add x0, x27, #1
4322 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 st2 { v1.2d, v2.2d }, [x27], x28
4323 # CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1
4324 # CHECK-NEXT: 4. 1 4.0 3.0 0.0 st2 { v1.2s, v2.2s }, [x27], x28
4325 # CHECK-NEXT: 5. 1 4.0 0.0 1.0 add x0, x27, #1
4326 # CHECK-NEXT: 6. 1 4.0 1.0 0.0 st2 { v1.4h, v2.4h }, [x27], x28
4327 # CHECK-NEXT: 7. 1 4.0 0.0 1.0 add x0, x27, #1
4328 # CHECK-NEXT: 8. 1 4.0 1.0 0.0 st2 { v1.4s, v2.4s }, [x27], x28
4329 # CHECK-NEXT: 9. 1 3.0 0.0 2.0 add x0, x27, #1
4330 # CHECK-NEXT: 1 2.9 0.9 0.7 <total>
4332 # CHECK: [69] Code Region - G70
4334 # CHECK: Iterations: 100
4335 # CHECK-NEXT: Instructions: 1000
4336 # CHECK-NEXT: Total Cycles: 1205
4337 # CHECK-NEXT: Total uOps: 2900
4339 # CHECK: Dispatch Width: 3
4340 # CHECK-NEXT: uOps Per Cycle: 2.41
4341 # CHECK-NEXT: IPC: 0.83
4342 # CHECK-NEXT: Block RThroughput: 12.0
4344 # CHECK: Timeline view:
4345 # CHECK-NEXT: 0123456
4346 # CHECK-NEXT: Index 0123456789
4348 # CHECK: [0,0] DeeeER . .. st2 { v1.8b, v2.8b }, [x27], x28
4349 # CHECK-NEXT: [0,1] .DeE-R . .. add x0, x27, #1
4350 # CHECK-NEXT: [0,2] . DeeeeER . .. st2 { v1.8h, v2.8h }, [x27], x28
4351 # CHECK-NEXT: [0,3] . DeE-R . .. add x0, x27, #1
4352 # CHECK-NEXT: [0,4] . D=eeeeER .. st2 { v1.16b, v2.16b }, [x27], x28
4353 # CHECK-NEXT: [0,5] . . DeE--R .. add x0, x27, #1
4354 # CHECK-NEXT: [0,6] . . D==eeeER. st2 { v1.b, v2.b }[0], [x27], #2
4355 # CHECK-NEXT: [0,7] . . D==eE-R. add x0, x27, #1
4356 # CHECK-NEXT: [0,8] . . D=eeeER st2 { v1.b, v2.b }[8], [x27], #2
4357 # CHECK-NEXT: [0,9] . . .D=eE-R add x0, x27, #1
4359 # CHECK: Average Wait times (based on the timeline view):
4360 # CHECK-NEXT: [0]: Executions
4361 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4362 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4363 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4365 # CHECK: [0] [1] [2] [3]
4366 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.8b, v2.8b }, [x27], x28
4367 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4368 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.8h, v2.8h }, [x27], x28
4369 # CHECK-NEXT: 3. 1 1.0 1.0 1.0 add x0, x27, #1
4370 # CHECK-NEXT: 4. 1 2.0 2.0 0.0 st2 { v1.16b, v2.16b }, [x27], x28
4371 # CHECK-NEXT: 5. 1 1.0 0.0 2.0 add x0, x27, #1
4372 # CHECK-NEXT: 6. 1 3.0 3.0 0.0 st2 { v1.b, v2.b }[0], [x27], #2
4373 # CHECK-NEXT: 7. 1 3.0 0.0 1.0 add x0, x27, #1
4374 # CHECK-NEXT: 8. 1 2.0 0.0 0.0 st2 { v1.b, v2.b }[8], [x27], #2
4375 # CHECK-NEXT: 9. 1 2.0 0.0 1.0 add x0, x27, #1
4376 # CHECK-NEXT: 1 1.7 0.8 0.6 <total>
4378 # CHECK: [70] Code Region - G71
4380 # CHECK: Iterations: 100
4381 # CHECK-NEXT: Instructions: 1000
4382 # CHECK-NEXT: Total Cycles: 1004
4383 # CHECK-NEXT: Total uOps: 2000
4385 # CHECK: Dispatch Width: 3
4386 # CHECK-NEXT: uOps Per Cycle: 1.99
4387 # CHECK-NEXT: IPC: 1.00
4388 # CHECK-NEXT: Block RThroughput: 6.7
4390 # CHECK: Timeline view:
4392 # CHECK-NEXT: Index 0123456789
4394 # CHECK: [0,0] DeeeER . . st2 { v1.b, v2.b }[0], [x27], x28
4395 # CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1
4396 # CHECK-NEXT: [0,2] . DeeeER . . st2 { v1.b, v2.b }[8], [x27], x28
4397 # CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1
4398 # CHECK-NEXT: [0,4] . DeeeER. . st2 { v1.h, v2.h }[0], [x27], #4
4399 # CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1
4400 # CHECK-NEXT: [0,6] . .DeeeER . st2 { v1.h, v2.h }[4], [x27], #4
4401 # CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1
4402 # CHECK-NEXT: [0,8] . . DeeeER st2 { v1.h, v2.h }[0], [x27], x28
4403 # CHECK-NEXT: [0,9] . . DeE-R add x0, x27, #1
4405 # CHECK: Average Wait times (based on the timeline view):
4406 # CHECK-NEXT: [0]: Executions
4407 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4408 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4409 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4411 # CHECK: [0] [1] [2] [3]
4412 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.b, v2.b }[0], [x27], x28
4413 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4414 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.b, v2.b }[8], [x27], x28
4415 # CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1
4416 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[0], [x27], #4
4417 # CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1
4418 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[4], [x27], #4
4419 # CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1
4420 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[0], [x27], x28
4421 # CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1
4422 # CHECK-NEXT: 1 1.0 0.5 0.5 <total>
4424 # CHECK: [71] Code Region - G72
4426 # CHECK: Iterations: 100
4427 # CHECK-NEXT: Instructions: 1000
4428 # CHECK-NEXT: Total Cycles: 1003
4429 # CHECK-NEXT: Total uOps: 2000
4431 # CHECK: Dispatch Width: 3
4432 # CHECK-NEXT: uOps Per Cycle: 1.99
4433 # CHECK-NEXT: IPC: 1.00
4434 # CHECK-NEXT: Block RThroughput: 7.0
4436 # CHECK: Timeline view:
4438 # CHECK-NEXT: Index 0123456789
4440 # CHECK: [0,0] DeeeER . . st2 { v1.h, v2.h }[4], [x27], x28
4441 # CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1
4442 # CHECK-NEXT: [0,2] . DeeeER . . st2 { v1.s, v2.s }[0], [x27], #8
4443 # CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1
4444 # CHECK-NEXT: [0,4] . DeeeER. . st2 { v1.s, v2.s }[0], [x27], x28
4445 # CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1
4446 # CHECK-NEXT: [0,6] . .DeeER . st2 { v1.d, v2.d }[0], [x27], #16
4447 # CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1
4448 # CHECK-NEXT: [0,8] . . DeeER st2 { v1.d, v2.d }[0], [x27], x28
4449 # CHECK-NEXT: [0,9] . . DeER add x0, x27, #1
4451 # CHECK: Average Wait times (based on the timeline view):
4452 # CHECK-NEXT: [0]: Executions
4453 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4454 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4455 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4457 # CHECK: [0] [1] [2] [3]
4458 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[4], [x27], x28
4459 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4460 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.s, v2.s }[0], [x27], #8
4461 # CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1
4462 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 st2 { v1.s, v2.s }[0], [x27], x28
4463 # CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1
4464 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 st2 { v1.d, v2.d }[0], [x27], #16
4465 # CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1
4466 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st2 { v1.d, v2.d }[0], [x27], x28
4467 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
4468 # CHECK-NEXT: 1 1.0 0.5 0.3 <total>
4470 # CHECK: [72] Code Region - G73
4472 # CHECK: Iterations: 100
4473 # CHECK-NEXT: Instructions: 600
4474 # CHECK-NEXT: Total Cycles: 1203
4475 # CHECK-NEXT: Total uOps: 2200
4477 # CHECK: Dispatch Width: 3
4478 # CHECK-NEXT: uOps Per Cycle: 1.83
4479 # CHECK-NEXT: IPC: 0.50
4480 # CHECK-NEXT: Block RThroughput: 12.0
4482 # CHECK: Timeline view:
4484 # CHECK-NEXT: Index 0123456789
4486 # CHECK: [0,0] DeeeeeeER . . st3 { v1.2d, v2.2d, v3.2d }, [x27], #48
4487 # CHECK-NEXT: [0,1] . DeE---R . . add x0, x27, #1
4488 # CHECK-NEXT: [0,2] . D===eeeER . st3 { v1.2s, v2.2s, v3.2s }, [x27], #24
4489 # CHECK-NEXT: [0,3] . D==eE-R . add x0, x27, #1
4490 # CHECK-NEXT: [0,4] . .D===eeeER st3 { v1.4h, v2.4h, v3.4h }, [x27], #24
4491 # CHECK-NEXT: [0,5] . . D==eE-R add x0, x27, #1
4493 # CHECK: Average Wait times (based on the timeline view):
4494 # CHECK-NEXT: [0]: Executions
4495 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4496 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4497 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4499 # CHECK: [0] [1] [2] [3]
4500 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.2d, v2.2d, v3.2d }, [x27], #48
4501 # CHECK-NEXT: 1. 1 1.0 1.0 3.0 add x0, x27, #1
4502 # CHECK-NEXT: 2. 1 4.0 4.0 0.0 st3 { v1.2s, v2.2s, v3.2s }, [x27], #24
4503 # CHECK-NEXT: 3. 1 3.0 0.0 1.0 add x0, x27, #1
4504 # CHECK-NEXT: 4. 1 4.0 2.0 0.0 st3 { v1.4h, v2.4h, v3.4h }, [x27], #24
4505 # CHECK-NEXT: 5. 1 3.0 0.0 1.0 add x0, x27, #1
4506 # CHECK-NEXT: 1 2.7 1.3 0.8 <total>
4508 # CHECK: [73] Code Region - G74
4510 # CHECK: Iterations: 100
4511 # CHECK-NEXT: Instructions: 1000
4512 # CHECK-NEXT: Total Cycles: 2703
4513 # CHECK-NEXT: Total uOps: 5100
4515 # CHECK: Dispatch Width: 3
4516 # CHECK-NEXT: uOps Per Cycle: 1.89
4517 # CHECK-NEXT: IPC: 0.37
4518 # CHECK-NEXT: Block RThroughput: 27.0
4520 # CHECK: Timeline view:
4521 # CHECK-NEXT: 0123456789
4522 # CHECK-NEXT: Index 0123456789 0123456789
4524 # CHECK: [0,0] DeeeeeeER . . . . . st3 { v1.4s, v2.4s, v3.4s }, [x27], #48
4525 # CHECK-NEXT: [0,1] . DeE--R . . . . . add x0, x27, #1
4526 # CHECK-NEXT: [0,2] . D==eeeER . . . . st3 { v1.8b, v2.8b, v3.8b }, [x27], #24
4527 # CHECK-NEXT: [0,3] . .D=eE-R . . . . add x0, x27, #1
4528 # CHECK-NEXT: [0,4] . . D==eeeeeeER . . . st3 { v1.8h, v2.8h, v3.8h }, [x27], #48
4529 # CHECK-NEXT: [0,5] . . DeE----R . . . add x0, x27, #1
4530 # CHECK-NEXT: [0,6] . . .D====eeeeeeER . . st3 { v1.16b, v2.16b, v3.16b }, [x27], #48
4531 # CHECK-NEXT: [0,7] . . . D==eE----R . . add x0, x27, #1
4532 # CHECK-NEXT: [0,8] . . . D======eeeeeeER st3 { v1.2d, v2.2d, v3.2d }, [x27], x28
4533 # CHECK-NEXT: [0,9] . . . . D=====eE----R add x0, x27, #1
4535 # CHECK: Average Wait times (based on the timeline view):
4536 # CHECK-NEXT: [0]: Executions
4537 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4538 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4539 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4541 # CHECK: [0] [1] [2] [3]
4542 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.4s, v2.4s, v3.4s }, [x27], #48
4543 # CHECK-NEXT: 1. 1 1.0 1.0 2.0 add x0, x27, #1
4544 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 st3 { v1.8b, v2.8b, v3.8b }, [x27], #24
4545 # CHECK-NEXT: 3. 1 2.0 0.0 1.0 add x0, x27, #1
4546 # CHECK-NEXT: 4. 1 3.0 2.0 0.0 st3 { v1.8h, v2.8h, v3.8h }, [x27], #48
4547 # CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1
4548 # CHECK-NEXT: 6. 1 5.0 5.0 0.0 st3 { v1.16b, v2.16b, v3.16b }, [x27], #48
4549 # CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1
4550 # CHECK-NEXT: 8. 1 7.0 5.0 0.0 st3 { v1.2d, v2.2d, v3.2d }, [x27], x28
4551 # CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1
4552 # CHECK-NEXT: 1 3.2 1.7 1.5 <total>
4554 # CHECK: [74] Code Region - G75
4556 # CHECK: Iterations: 100
4557 # CHECK-NEXT: Instructions: 1000
4558 # CHECK-NEXT: Total Cycles: 2103
4559 # CHECK-NEXT: Total uOps: 4500
4561 # CHECK: Dispatch Width: 3
4562 # CHECK-NEXT: uOps Per Cycle: 2.14
4563 # CHECK-NEXT: IPC: 0.48
4564 # CHECK-NEXT: Block RThroughput: 21.0
4566 # CHECK: Timeline view:
4567 # CHECK-NEXT: 0123456789
4568 # CHECK-NEXT: Index 0123456789 0123
4570 # CHECK: [0,0] DeeeER . . . . st3 { v1.2s, v2.2s, v3.2s }, [x27], x28
4571 # CHECK-NEXT: [0,1] . DeER . . . . add x0, x27, #1
4572 # CHECK-NEXT: [0,2] . DeeeER . . . . st3 { v1.4h, v2.4h, v3.4h }, [x27], x28
4573 # CHECK-NEXT: [0,3] . DeER . . . . add x0, x27, #1
4574 # CHECK-NEXT: [0,4] . .DeeeeeeER. . . st3 { v1.4s, v2.4s, v3.4s }, [x27], x28
4575 # CHECK-NEXT: [0,5] . . DeE--R. . . add x0, x27, #1
4576 # CHECK-NEXT: [0,6] . . D==eeeER . . st3 { v1.8b, v2.8b, v3.8b }, [x27], x28
4577 # CHECK-NEXT: [0,7] . . . D=eE-R . . add x0, x27, #1
4578 # CHECK-NEXT: [0,8] . . . D==eeeeeeER st3 { v1.8h, v2.8h, v3.8h }, [x27], x28
4579 # CHECK-NEXT: [0,9] . . . .DeE----R add x0, x27, #1
4581 # CHECK: Average Wait times (based on the timeline view):
4582 # CHECK-NEXT: [0]: Executions
4583 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4584 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4585 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4587 # CHECK: [0] [1] [2] [3]
4588 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.2s, v2.2s, v3.2s }, [x27], x28
4589 # CHECK-NEXT: 1. 1 1.0 1.0 0.0 add x0, x27, #1
4590 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st3 { v1.4h, v2.4h, v3.4h }, [x27], x28
4591 # CHECK-NEXT: 3. 1 1.0 1.0 0.0 add x0, x27, #1
4592 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 st3 { v1.4s, v2.4s, v3.4s }, [x27], x28
4593 # CHECK-NEXT: 5. 1 1.0 1.0 2.0 add x0, x27, #1
4594 # CHECK-NEXT: 6. 1 3.0 3.0 0.0 st3 { v1.8b, v2.8b, v3.8b }, [x27], x28
4595 # CHECK-NEXT: 7. 1 2.0 0.0 1.0 add x0, x27, #1
4596 # CHECK-NEXT: 8. 1 3.0 2.0 0.0 st3 { v1.8h, v2.8h, v3.8h }, [x27], x28
4597 # CHECK-NEXT: 9. 1 1.0 0.0 4.0 add x0, x27, #1
4598 # CHECK-NEXT: 1 1.5 1.1 0.7 <total>
4600 # CHECK: [75] Code Region - G76
4602 # CHECK: Iterations: 100
4603 # CHECK-NEXT: Instructions: 1000
4604 # CHECK-NEXT: Total Cycles: 1204
4605 # CHECK-NEXT: Total uOps: 2800
4607 # CHECK: Dispatch Width: 3
4608 # CHECK-NEXT: uOps Per Cycle: 2.33
4609 # CHECK-NEXT: IPC: 0.83
4610 # CHECK-NEXT: Block RThroughput: 10.0
4612 # CHECK: Timeline view:
4613 # CHECK-NEXT: 012345
4614 # CHECK-NEXT: Index 0123456789
4616 # CHECK: [0,0] DeeeeeeER . . st3 { v1.16b, v2.16b, v3.16b }, [x27], x28
4617 # CHECK-NEXT: [0,1] . DeE--R . . add x0, x27, #1
4618 # CHECK-NEXT: [0,2] . D==eeeER . st3 { v1.b, v2.b, v3.b }[0], [x27], #3
4619 # CHECK-NEXT: [0,3] . D==eE-R . add x0, x27, #1
4620 # CHECK-NEXT: [0,4] . .D=eeeER . st3 { v1.b, v2.b, v3.b }[8], [x27], #3
4621 # CHECK-NEXT: [0,5] . . D=eE-R . add x0, x27, #1
4622 # CHECK-NEXT: [0,6] . . DeeeER . st3 { v1.b, v2.b, v3.b }[0], [x27], x28
4623 # CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1
4624 # CHECK-NEXT: [0,8] . . DeeeER st3 { v1.b, v2.b, v3.b }[8], [x27], x28
4625 # CHECK-NEXT: [0,9] . . .DeE-R add x0, x27, #1
4627 # CHECK: Average Wait times (based on the timeline view):
4628 # CHECK-NEXT: [0]: Executions
4629 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4630 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4631 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4633 # CHECK: [0] [1] [2] [3]
4634 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.16b, v2.16b, v3.16b }, [x27], x28
4635 # CHECK-NEXT: 1. 1 1.0 1.0 2.0 add x0, x27, #1
4636 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 st3 { v1.b, v2.b, v3.b }[0], [x27], #3
4637 # CHECK-NEXT: 3. 1 3.0 0.0 1.0 add x0, x27, #1
4638 # CHECK-NEXT: 4. 1 2.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[8], [x27], #3
4639 # CHECK-NEXT: 5. 1 2.0 0.0 1.0 add x0, x27, #1
4640 # CHECK-NEXT: 6. 1 1.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[0], [x27], x28
4641 # CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1
4642 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st3 { v1.b, v2.b, v3.b }[8], [x27], x28
4643 # CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1
4644 # CHECK-NEXT: 1 1.6 0.6 0.6 <total>
4646 # CHECK: [76] Code Region - G77
4648 # CHECK: Iterations: 100
4649 # CHECK-NEXT: Instructions: 1000
4650 # CHECK-NEXT: Total Cycles: 1004
4651 # CHECK-NEXT: Total uOps: 2100
4653 # CHECK: Dispatch Width: 3
4654 # CHECK-NEXT: uOps Per Cycle: 2.09
4655 # CHECK-NEXT: IPC: 1.00
4656 # CHECK-NEXT: Block RThroughput: 7.0
4658 # CHECK: Timeline view:
4660 # CHECK-NEXT: Index 0123456789
4662 # CHECK: [0,0] DeeeER . . st3 { v1.h, v2.h, v3.h }[0], [x27], #6
4663 # CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1
4664 # CHECK-NEXT: [0,2] . DeeeER . . st3 { v1.h, v2.h, v3.h }[4], [x27], #6
4665 # CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1
4666 # CHECK-NEXT: [0,4] . DeeeER. . st3 { v1.h, v2.h, v3.h }[0], [x27], x28
4667 # CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1
4668 # CHECK-NEXT: [0,6] . .DeeeER . st3 { v1.h, v2.h, v3.h }[4], [x27], x28
4669 # CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1
4670 # CHECK-NEXT: [0,8] . . DeeeER st3 { v1.s, v2.s, v3.s }[0], [x27], #12
4671 # CHECK-NEXT: [0,9] . . DeE-R add x0, x27, #1
4673 # CHECK: Average Wait times (based on the timeline view):
4674 # CHECK-NEXT: [0]: Executions
4675 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4676 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4677 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4679 # CHECK: [0] [1] [2] [3]
4680 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[0], [x27], #6
4681 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4682 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[4], [x27], #6
4683 # CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1
4684 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[0], [x27], x28
4685 # CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1
4686 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[4], [x27], x28
4687 # CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1
4688 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st3 { v1.s, v2.s, v3.s }[0], [x27], #12
4689 # CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1
4690 # CHECK-NEXT: 1 1.0 0.5 0.5 <total>
4692 # CHECK: [77] Code Region - G78
4694 # CHECK: Iterations: 100
4695 # CHECK-NEXT: Instructions: 1000
4696 # CHECK-NEXT: Total Cycles: 1903
4697 # CHECK-NEXT: Total uOps: 3300
4699 # CHECK: Dispatch Width: 3
4700 # CHECK-NEXT: uOps Per Cycle: 1.73
4701 # CHECK-NEXT: IPC: 0.53
4702 # CHECK-NEXT: Block RThroughput: 19.0
4704 # CHECK: Timeline view:
4705 # CHECK-NEXT: 0123456789
4706 # CHECK-NEXT: Index 0123456789 01
4708 # CHECK: [0,0] DeeeER . . .. st3 { v1.s, v2.s, v3.s }[0], [x27], x28
4709 # CHECK-NEXT: [0,1] .DeE-R . . .. add x0, x27, #1
4710 # CHECK-NEXT: [0,2] . D=eeeER . . .. st3 { v1.d, v2.d, v3.d }[0], [x27], #24
4711 # CHECK-NEXT: [0,3] . D=eE-R . . .. add x0, x27, #1
4712 # CHECK-NEXT: [0,4] . D=eeeER . .. st3 { v1.d, v2.d, v3.d }[0], [x27], x28
4713 # CHECK-NEXT: [0,5] . D=eE-R . .. add x0, x27, #1
4714 # CHECK-NEXT: [0,6] . .D=eeeeeeeeER .. st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
4715 # CHECK-NEXT: [0,7] . . DeE-----R .. add x0, x27, #1
4716 # CHECK-NEXT: [0,8] . . D=====eeeeER st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
4717 # CHECK-NEXT: [0,9] . . . D====eE--R add x0, x27, #1
4719 # CHECK: Average Wait times (based on the timeline view):
4720 # CHECK-NEXT: [0]: Executions
4721 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4722 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4723 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4725 # CHECK: [0] [1] [2] [3]
4726 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.s, v2.s, v3.s }[0], [x27], x28
4727 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4728 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 st3 { v1.d, v2.d, v3.d }[0], [x27], #24
4729 # CHECK-NEXT: 3. 1 2.0 0.0 1.0 add x0, x27, #1
4730 # CHECK-NEXT: 4. 1 2.0 1.0 0.0 st3 { v1.d, v2.d, v3.d }[0], [x27], x28
4731 # CHECK-NEXT: 5. 1 2.0 0.0 1.0 add x0, x27, #1
4732 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
4733 # CHECK-NEXT: 7. 1 1.0 1.0 5.0 add x0, x27, #1
4734 # CHECK-NEXT: 8. 1 6.0 6.0 0.0 st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
4735 # CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1
4736 # CHECK-NEXT: 1 2.4 1.2 1.0 <total>
4738 # CHECK: [78] Code Region - G79
4740 # CHECK: Iterations: 100
4741 # CHECK-NEXT: Instructions: 1000
4742 # CHECK-NEXT: Total Cycles: 3203
4743 # CHECK-NEXT: Total uOps: 5800
4745 # CHECK: Dispatch Width: 3
4746 # CHECK-NEXT: uOps Per Cycle: 1.81
4747 # CHECK-NEXT: IPC: 0.31
4748 # CHECK-NEXT: Block RThroughput: 32.0
4750 # CHECK: Timeline view:
4751 # CHECK-NEXT: 0123456789 01234
4752 # CHECK-NEXT: Index 0123456789 0123456789
4754 # CHECK: [0,0] DeeeeER . . . . . . st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
4755 # CHECK-NEXT: [0,1] . DeE-R . . . . . . add x0, x27, #1
4756 # CHECK-NEXT: [0,2] . D=eeeeeeeeER. . . . . st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4757 # CHECK-NEXT: [0,3] . . DeE----R. . . . . add x0, x27, #1
4758 # CHECK-NEXT: [0,4] . . D====eeeeER . . . . st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4759 # CHECK-NEXT: [0,5] . . D===eE--R . . . . add x0, x27, #1
4760 # CHECK-NEXT: [0,6] . . .D=====eeeeeeeeER . . st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4761 # CHECK-NEXT: [0,7] . . . D==eE------R . . add x0, x27, #1
4762 # CHECK-NEXT: [0,8] . . . .D========eeeeeeeeER st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4763 # CHECK-NEXT: [0,9] . . . . D=====eE------R add x0, x27, #1
4765 # CHECK: Average Wait times (based on the timeline view):
4766 # CHECK-NEXT: [0]: Executions
4767 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4768 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4769 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4771 # CHECK: [0] [1] [2] [3]
4772 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
4773 # CHECK-NEXT: 1. 1 1.0 1.0 1.0 add x0, x27, #1
4774 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4775 # CHECK-NEXT: 3. 1 1.0 1.0 4.0 add x0, x27, #1
4776 # CHECK-NEXT: 4. 1 5.0 5.0 0.0 st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4777 # CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1
4778 # CHECK-NEXT: 6. 1 6.0 3.0 0.0 st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4779 # CHECK-NEXT: 7. 1 3.0 0.0 6.0 add x0, x27, #1
4780 # CHECK-NEXT: 8. 1 9.0 7.0 0.0 st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4781 # CHECK-NEXT: 9. 1 6.0 0.0 6.0 add x0, x27, #1
4782 # CHECK-NEXT: 1 3.8 2.0 1.9 <total>
4784 # CHECK: [79] Code Region - G80
4786 # CHECK: Iterations: 100
4787 # CHECK-NEXT: Instructions: 1000
4788 # CHECK-NEXT: Total Cycles: 2803
4789 # CHECK-NEXT: Total uOps: 4800
4791 # CHECK: Dispatch Width: 3
4792 # CHECK-NEXT: uOps Per Cycle: 1.71
4793 # CHECK-NEXT: IPC: 0.36
4794 # CHECK-NEXT: Block RThroughput: 28.0
4796 # CHECK: Timeline view:
4797 # CHECK-NEXT: 0123456789 0
4798 # CHECK-NEXT: Index 0123456789 0123456789
4800 # CHECK: [0,0] DeeeeeeeeER . . . . st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4801 # CHECK-NEXT: [0,1] . DeE----R . . . . add x0, x27, #1
4802 # CHECK-NEXT: [0,2] . D====eeeeER. . . . st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4803 # CHECK-NEXT: [0,3] . .D===eE--R. . . . add x0, x27, #1
4804 # CHECK-NEXT: [0,4] . . D=====eeeeER . . . st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4805 # CHECK-NEXT: [0,5] . . D====eE--R . . . add x0, x27, #1
4806 # CHECK-NEXT: [0,6] . . D======eeeeeeeeER . st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4807 # CHECK-NEXT: [0,7] . . . D===eE------R . add x0, x27, #1
4808 # CHECK-NEXT: [0,8] . . . D=========eeeeER st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4809 # CHECK-NEXT: [0,9] . . . . D========eE--R add x0, x27, #1
4811 # CHECK: Average Wait times (based on the timeline view):
4812 # CHECK-NEXT: [0]: Executions
4813 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4814 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4815 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4817 # CHECK: [0] [1] [2] [3]
4818 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4819 # CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1
4820 # CHECK-NEXT: 2. 1 5.0 5.0 0.0 st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4821 # CHECK-NEXT: 3. 1 4.0 0.0 2.0 add x0, x27, #1
4822 # CHECK-NEXT: 4. 1 6.0 3.0 0.0 st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4823 # CHECK-NEXT: 5. 1 5.0 0.0 2.0 add x0, x27, #1
4824 # CHECK-NEXT: 6. 1 7.0 3.0 0.0 st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4825 # CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1
4826 # CHECK-NEXT: 8. 1 10.0 7.0 0.0 st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4827 # CHECK-NEXT: 9. 1 9.0 0.0 2.0 add x0, x27, #1
4828 # CHECK-NEXT: 1 5.2 2.0 1.6 <total>
4830 # CHECK: [80] Code Region - G81
4832 # CHECK: Iterations: 100
4833 # CHECK-NEXT: Instructions: 1000
4834 # CHECK-NEXT: Total Cycles: 1905
4835 # CHECK-NEXT: Total uOps: 4000
4837 # CHECK: Dispatch Width: 3
4838 # CHECK-NEXT: uOps Per Cycle: 2.10
4839 # CHECK-NEXT: IPC: 0.52
4840 # CHECK-NEXT: Block RThroughput: 19.0
4842 # CHECK: Timeline view:
4843 # CHECK-NEXT: 0123456789
4844 # CHECK-NEXT: Index 0123456789 0123
4846 # CHECK: [0,0] DeeeeeeeeER . . . st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4847 # CHECK-NEXT: [0,1] . DeE---R . . . add x0, x27, #1
4848 # CHECK-NEXT: [0,2] . D===eeeeeeeeER . . st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4849 # CHECK-NEXT: [0,3] . . DeE------R . . add x0, x27, #1
4850 # CHECK-NEXT: [0,4] . . D======eeeER . st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
4851 # CHECK-NEXT: [0,5] . . .D======eE-R . add x0, x27, #1
4852 # CHECK-NEXT: [0,6] . . . D=====eeeER. st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
4853 # CHECK-NEXT: [0,7] . . . D=====eE-R. add x0, x27, #1
4854 # CHECK-NEXT: [0,8] . . . D====eeeER st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
4855 # CHECK-NEXT: [0,9] . . . D====eE-R add x0, x27, #1
4857 # CHECK: Average Wait times (based on the timeline view):
4858 # CHECK-NEXT: [0]: Executions
4859 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4860 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4861 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4863 # CHECK: [0] [1] [2] [3]
4864 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4865 # CHECK-NEXT: 1. 1 1.0 1.0 3.0 add x0, x27, #1
4866 # CHECK-NEXT: 2. 1 4.0 4.0 0.0 st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4867 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
4868 # CHECK-NEXT: 4. 1 7.0 7.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
4869 # CHECK-NEXT: 5. 1 7.0 0.0 1.0 add x0, x27, #1
4870 # CHECK-NEXT: 6. 1 6.0 0.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
4871 # CHECK-NEXT: 7. 1 6.0 0.0 1.0 add x0, x27, #1
4872 # CHECK-NEXT: 8. 1 5.0 0.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
4873 # CHECK-NEXT: 9. 1 5.0 0.0 1.0 add x0, x27, #1
4874 # CHECK-NEXT: 1 4.3 1.3 1.2 <total>
4876 # CHECK: [81] Code Region - G82
4878 # CHECK: Iterations: 100
4879 # CHECK-NEXT: Instructions: 1000
4880 # CHECK-NEXT: Total Cycles: 1004
4881 # CHECK-NEXT: Total uOps: 2000
4883 # CHECK: Dispatch Width: 3
4884 # CHECK-NEXT: uOps Per Cycle: 1.99
4885 # CHECK-NEXT: IPC: 1.00
4886 # CHECK-NEXT: Block RThroughput: 6.7
4888 # CHECK: Timeline view:
4890 # CHECK-NEXT: Index 0123456789
4892 # CHECK: [0,0] DeeeER . . st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
4893 # CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1
4894 # CHECK-NEXT: [0,2] . DeeeER . . st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
4895 # CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1
4896 # CHECK-NEXT: [0,4] . DeeeER. . st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
4897 # CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1
4898 # CHECK-NEXT: [0,6] . .DeeeER . st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
4899 # CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1
4900 # CHECK-NEXT: [0,8] . . DeeeER st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
4901 # CHECK-NEXT: [0,9] . . DeE-R add x0, x27, #1
4903 # CHECK: Average Wait times (based on the timeline view):
4904 # CHECK-NEXT: [0]: Executions
4905 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4906 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4907 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4909 # CHECK: [0] [1] [2] [3]
4910 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
4911 # CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1
4912 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
4913 # CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1
4914 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
4915 # CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1
4916 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
4917 # CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1
4918 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
4919 # CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1
4920 # CHECK-NEXT: 1 1.0 0.5 0.5 <total>
4922 # CHECK: [82] Code Region - G83
4924 # CHECK: Iterations: 100
4925 # CHECK-NEXT: Instructions: 800
4926 # CHECK-NEXT: Total Cycles: 1204
4927 # CHECK-NEXT: Total uOps: 2200
4929 # CHECK: Dispatch Width: 3
4930 # CHECK-NEXT: uOps Per Cycle: 1.83
4931 # CHECK-NEXT: IPC: 0.66
4932 # CHECK-NEXT: Block RThroughput: 12.0
4934 # CHECK: Timeline view:
4935 # CHECK-NEXT: 012345
4936 # CHECK-NEXT: Index 0123456789
4938 # CHECK: [0,0] DeeeeER . . st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
4939 # CHECK-NEXT: [0,1] .DeE--R . . add x0, x27, #1
4940 # CHECK-NEXT: [0,2] . D==eeeeER . st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
4941 # CHECK-NEXT: [0,3] . D==eE--R . add x0, x27, #1
4942 # CHECK-NEXT: [0,4] . D====eeeER . st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
4943 # CHECK-NEXT: [0,5] . D====eE-R . add x0, x27, #1
4944 # CHECK-NEXT: [0,6] . .D====eeeER st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
4945 # CHECK-NEXT: [0,7] . . D====eE-R add x0, x27, #1
4947 # CHECK: Average Wait times (based on the timeline view):
4948 # CHECK-NEXT: [0]: Executions
4949 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4950 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4951 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4953 # CHECK: [0] [1] [2] [3]
4954 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
4955 # CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1
4956 # CHECK-NEXT: 2. 1 3.0 3.0 0.0 st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
4957 # CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1
4958 # CHECK-NEXT: 4. 1 5.0 3.0 0.0 st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
4959 # CHECK-NEXT: 5. 1 5.0 0.0 1.0 add x0, x27, #1
4960 # CHECK-NEXT: 6. 1 5.0 1.0 0.0 st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
4961 # CHECK-NEXT: 7. 1 5.0 0.0 1.0 add x0, x27, #1
4962 # CHECK-NEXT: 1 3.5 1.0 0.8 <total>
4964 # CHECK: [83] Code Region - G84
4966 # CHECK: Iterations: 100
4967 # CHECK-NEXT: Instructions: 400
4968 # CHECK-NEXT: Total Cycles: 403
4969 # CHECK-NEXT: Total uOps: 900
4971 # CHECK: Dispatch Width: 3
4972 # CHECK-NEXT: uOps Per Cycle: 2.23
4973 # CHECK-NEXT: IPC: 0.99
4974 # CHECK-NEXT: Block RThroughput: 3.0
4976 # CHECK: Timeline view:
4977 # CHECK-NEXT: Index 0123456
4979 # CHECK: [0,0] DeER .. stp s1, s2, [x27], #248
4980 # CHECK-NEXT: [0,1] .DeER.. add x0, x27, #1
4981 # CHECK-NEXT: [0,2] . DeeER stp d1, d2, [x27], #496
4982 # CHECK-NEXT: [0,3] . DeER add x0, x27, #1
4984 # CHECK: Average Wait times (based on the timeline view):
4985 # CHECK-NEXT: [0]: Executions
4986 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4987 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4988 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4990 # CHECK: [0] [1] [2] [3]
4991 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp s1, s2, [x27], #248
4992 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
4993 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 stp d1, d2, [x27], #496
4994 # CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1
4995 # CHECK-NEXT: 1 1.0 0.5 0.0 <total>
4997 # CHECK: [84] Code Region - G85
4999 # CHECK: Iterations: 100
5000 # CHECK-NEXT: Instructions: 1000
5001 # CHECK-NEXT: Total Cycles: 1207
5002 # CHECK-NEXT: Total uOps: 2800
5004 # CHECK: Dispatch Width: 3
5005 # CHECK-NEXT: uOps Per Cycle: 2.32
5006 # CHECK-NEXT: IPC: 0.83
5007 # CHECK-NEXT: Block RThroughput: 12.0
5009 # CHECK: Timeline view:
5010 # CHECK-NEXT: 0123456
5011 # CHECK-NEXT: Index 0123456789
5013 # CHECK: [0,0] DeeeeER . .. stp q1, q2, [x27], #992
5014 # CHECK-NEXT: [0,1] . DeE-R . .. add x0, x27, #1
5015 # CHECK-NEXT: [0,2] . D=eER . .. stp s1, s2, [x27, #248]!
5016 # CHECK-NEXT: [0,3] . D=eER . .. add x0, x27, #1
5017 # CHECK-NEXT: [0,4] . D=eeER .. stp d1, d2, [x27, #496]!
5018 # CHECK-NEXT: [0,5] . .D=eER .. add x0, x27, #1
5019 # CHECK-NEXT: [0,6] . . D=eeeeER.. stp q1, q2, [x27, #992]!
5020 # CHECK-NEXT: [0,7] . . DeE--R.. add x0, x27, #1
5021 # CHECK-NEXT: [0,8] . . D==eER. stp w1, w2, [x27], #248
5022 # CHECK-NEXT: [0,9] . . .D==eER add x0, x27, #1
5024 # CHECK: Average Wait times (based on the timeline view):
5025 # CHECK-NEXT: [0]: Executions
5026 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5027 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5028 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5030 # CHECK: [0] [1] [2] [3]
5031 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp q1, q2, [x27], #992
5032 # CHECK-NEXT: 1. 1 1.0 1.0 1.0 add x0, x27, #1
5033 # CHECK-NEXT: 2. 1 2.0 2.0 0.0 stp s1, s2, [x27, #248]!
5034 # CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1
5035 # CHECK-NEXT: 4. 1 2.0 1.0 0.0 stp d1, d2, [x27, #496]!
5036 # CHECK-NEXT: 5. 1 2.0 0.0 0.0 add x0, x27, #1
5037 # CHECK-NEXT: 6. 1 2.0 1.0 0.0 stp q1, q2, [x27, #992]!
5038 # CHECK-NEXT: 7. 1 1.0 0.0 2.0 add x0, x27, #1
5039 # CHECK-NEXT: 8. 1 3.0 3.0 0.0 stp w1, w2, [x27], #248
5040 # CHECK-NEXT: 9. 1 3.0 0.0 0.0 add x0, x27, #1
5041 # CHECK-NEXT: 1 1.9 0.9 0.3 <total>
5043 # CHECK: [85] Code Region - G86
5045 # CHECK: Iterations: 100
5046 # CHECK-NEXT: Instructions: 1000
5047 # CHECK-NEXT: Total Cycles: 1003
5048 # CHECK-NEXT: Total uOps: 2200
5050 # CHECK: Dispatch Width: 3
5051 # CHECK-NEXT: uOps Per Cycle: 2.19
5052 # CHECK-NEXT: IPC: 1.00
5053 # CHECK-NEXT: Block RThroughput: 7.5
5055 # CHECK: Timeline view:
5057 # CHECK-NEXT: Index 0123456789
5059 # CHECK: [0,0] DeeER. . . stp x1, x2, [x27], #496
5060 # CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1
5061 # CHECK-NEXT: [0,2] . DeER . . stp w1, w2, [x27, #248]!
5062 # CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1
5063 # CHECK-NEXT: [0,4] . DeeER . . stp x1, x2, [x27, #496]!
5064 # CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1
5065 # CHECK-NEXT: [0,6] . .DeER. . str b1, [x27], #254
5066 # CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1
5067 # CHECK-NEXT: [0,8] . . DeER. str h1, [x27], #254
5068 # CHECK-NEXT: [0,9] . . DeER add x0, x27, #1
5070 # CHECK: Average Wait times (based on the timeline view):
5071 # CHECK-NEXT: [0]: Executions
5072 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5073 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5074 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5076 # CHECK: [0] [1] [2] [3]
5077 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp x1, x2, [x27], #496
5078 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
5079 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 stp w1, w2, [x27, #248]!
5080 # CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1
5081 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 stp x1, x2, [x27, #496]!
5082 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
5083 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 str b1, [x27], #254
5084 # CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1
5085 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 str h1, [x27], #254
5086 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
5087 # CHECK-NEXT: 1 1.0 0.5 0.0 <total>
5089 # CHECK: [86] Code Region - G87
5091 # CHECK: Iterations: 100
5092 # CHECK-NEXT: Instructions: 1000
5093 # CHECK-NEXT: Total Cycles: 1003
5094 # CHECK-NEXT: Total uOps: 2100
5096 # CHECK: Dispatch Width: 3
5097 # CHECK-NEXT: uOps Per Cycle: 2.09
5098 # CHECK-NEXT: IPC: 1.00
5099 # CHECK-NEXT: Block RThroughput: 7.5
5101 # CHECK: Timeline view:
5103 # CHECK-NEXT: Index 0123456789
5105 # CHECK: [0,0] DeER . . . str s1, [x27], #254
5106 # CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1
5107 # CHECK-NEXT: [0,2] . DeER . . str d1, [x27], #254
5108 # CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1
5109 # CHECK-NEXT: [0,4] . DeeER . . str q1, [x27], #254
5110 # CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1
5111 # CHECK-NEXT: [0,6] . .DeER. . str b1, [x27, #254]!
5112 # CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1
5113 # CHECK-NEXT: [0,8] . . DeER. str h1, [x27, #254]!
5114 # CHECK-NEXT: [0,9] . . DeER add x0, x27, #1
5116 # CHECK: Average Wait times (based on the timeline view):
5117 # CHECK-NEXT: [0]: Executions
5118 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5119 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5120 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5122 # CHECK: [0] [1] [2] [3]
5123 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 str s1, [x27], #254
5124 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
5125 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 str d1, [x27], #254
5126 # CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1
5127 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 str q1, [x27], #254
5128 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
5129 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 str b1, [x27, #254]!
5130 # CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1
5131 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 str h1, [x27, #254]!
5132 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
5133 # CHECK-NEXT: 1 1.0 0.5 0.0 <total>
5135 # CHECK: [87] Code Region - G88
5137 # CHECK: Iterations: 100
5138 # CHECK-NEXT: Instructions: 1000
5139 # CHECK-NEXT: Total Cycles: 1003
5140 # CHECK-NEXT: Total uOps: 2100
5142 # CHECK: Dispatch Width: 3
5143 # CHECK-NEXT: uOps Per Cycle: 2.09
5144 # CHECK-NEXT: IPC: 1.00
5145 # CHECK-NEXT: Block RThroughput: 7.5
5147 # CHECK: Timeline view:
5149 # CHECK-NEXT: Index 0123456789
5151 # CHECK: [0,0] DeER . . . str s1, [x27, #254]!
5152 # CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1
5153 # CHECK-NEXT: [0,2] . DeER . . str d1, [x27, #254]!
5154 # CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1
5155 # CHECK-NEXT: [0,4] . DeeER . . str q1, [x27, #254]!
5156 # CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1
5157 # CHECK-NEXT: [0,6] . .DeER. . str w1, [x27], #254
5158 # CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1
5159 # CHECK-NEXT: [0,8] . . DeER. str x1, [x27], #254
5160 # CHECK-NEXT: [0,9] . . DeER add x0, x27, #1
5162 # CHECK: Average Wait times (based on the timeline view):
5163 # CHECK-NEXT: [0]: Executions
5164 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5165 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5166 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5168 # CHECK: [0] [1] [2] [3]
5169 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 str s1, [x27, #254]!
5170 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
5171 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 str d1, [x27, #254]!
5172 # CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1
5173 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 str q1, [x27, #254]!
5174 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
5175 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 str w1, [x27], #254
5176 # CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1
5177 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 str x1, [x27], #254
5178 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
5179 # CHECK-NEXT: 1 1.0 0.5 0.0 <total>
5181 # CHECK: [88] Code Region - G89
5183 # CHECK: Iterations: 100
5184 # CHECK-NEXT: Instructions: 1000
5185 # CHECK-NEXT: Total Cycles: 1003
5186 # CHECK-NEXT: Total uOps: 2000
5188 # CHECK: Dispatch Width: 3
5189 # CHECK-NEXT: uOps Per Cycle: 1.99
5190 # CHECK-NEXT: IPC: 1.00
5191 # CHECK-NEXT: Block RThroughput: 7.5
5193 # CHECK: Timeline view:
5195 # CHECK-NEXT: Index 0123456789
5197 # CHECK: [0,0] DeER . . . str w1, [x27, #254]!
5198 # CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1
5199 # CHECK-NEXT: [0,2] . DeER . . str x1, [x27, #254]!
5200 # CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1
5201 # CHECK-NEXT: [0,4] . DeER . . strb w1, [x27], #254
5202 # CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1
5203 # CHECK-NEXT: [0,6] . .DeER. . strb w1, [x27, #254]!
5204 # CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1
5205 # CHECK-NEXT: [0,8] . . DeER. strh w1, [x27], #254
5206 # CHECK-NEXT: [0,9] . . DeER add x0, x27, #1
5208 # CHECK: Average Wait times (based on the timeline view):
5209 # CHECK-NEXT: [0]: Executions
5210 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5211 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5212 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5214 # CHECK: [0] [1] [2] [3]
5215 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 str w1, [x27, #254]!
5216 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
5217 # CHECK-NEXT: 2. 1 1.0 1.0 0.0 str x1, [x27, #254]!
5218 # CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1
5219 # CHECK-NEXT: 4. 1 1.0 1.0 0.0 strb w1, [x27], #254
5220 # CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1
5221 # CHECK-NEXT: 6. 1 1.0 1.0 0.0 strb w1, [x27, #254]!
5222 # CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1
5223 # CHECK-NEXT: 8. 1 1.0 1.0 0.0 strh w1, [x27], #254
5224 # CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1
5225 # CHECK-NEXT: 1 1.0 0.5 0.0 <total>
5227 # CHECK: [89] Code Region - G90
5229 # CHECK: Iterations: 100
5230 # CHECK-NEXT: Instructions: 200
5231 # CHECK-NEXT: Total Cycles: 203
5232 # CHECK-NEXT: Total uOps: 400
5234 # CHECK: Dispatch Width: 3
5235 # CHECK-NEXT: uOps Per Cycle: 1.97
5236 # CHECK-NEXT: IPC: 0.99
5237 # CHECK-NEXT: Block RThroughput: 1.5
5239 # CHECK: Timeline view:
5240 # CHECK-NEXT: Index 01234
5242 # CHECK: [0,0] DeER. strh w1, [x27, #254]!
5243 # CHECK-NEXT: [0,1] .DeER add x0, x27, #1
5245 # CHECK: Average Wait times (based on the timeline view):
5246 # CHECK-NEXT: [0]: Executions
5247 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5248 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5249 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5251 # CHECK: [0] [1] [2] [3]
5252 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 strh w1, [x27, #254]!
5253 # CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1
5254 # CHECK-NEXT: 1 1.0 0.5 0.0 <total>
5256 # CHECK: [90] Code Region - G91
5258 # CHECK: Iterations: 100
5259 # CHECK-NEXT: Instructions: 400
5260 # CHECK-NEXT: Total Cycles: 210
5261 # CHECK-NEXT: Total uOps: 600
5263 # CHECK: Dispatch Width: 3
5264 # CHECK-NEXT: uOps Per Cycle: 2.86
5265 # CHECK-NEXT: IPC: 1.90
5266 # CHECK-NEXT: Block RThroughput: 2.0
5268 # CHECK: Timeline view:
5270 # CHECK-NEXT: Index 0123456789
5272 # CHECK: [0,0] DeeeeER . ldr x1, [x27], #254
5273 # CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1
5274 # CHECK-NEXT: [0,2] .D===eeeeER ldr x2, [x1], #254
5275 # CHECK-NEXT: [0,3] .DeE------R add x0, x27, #1
5277 # CHECK: Average Wait times (based on the timeline view):
5278 # CHECK-NEXT: [0]: Executions
5279 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5280 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5281 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5283 # CHECK: [0] [1] [2] [3]
5284 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr x1, [x27], #254
5285 # CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1
5286 # CHECK-NEXT: 2. 1 4.0 0.0 0.0 ldr x2, [x1], #254
5287 # CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1
5288 # CHECK-NEXT: 1 2.0 0.3 2.0 <total>