1 # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2 # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=bdver2 -iterations=1 -resource-pressure=false -instruction-info=false -dispatch-stats -register-file-stats -timeline < %s | FileCheck %s
# Input sequence: one vdivps followed by 32 vaddps, all on 256-bit YMM
# registers (33 instructions in total, matching the expectations below).
#
#  * The first 14 vaddps read only %ymm0 and each writes a different
#    destination (%ymm2 .. %ymm15).
#  * `vaddps %ymm2, %ymm0, %ymm0` then redefines %ymm0, so every later
#    instruction that reads %ymm0 reads this new definition.
#  * The last four vaddps additionally read %ymm3, whose most recent writer
#    is `vaddps %ymm2, %ymm0, %ymm3`.
#
# The expectations report 66 uOps and 66 PdFpuPRF mappings for these 33
# instructions, with no dispatch stall attributed to the register file.
# NOTE(review): presumably each YMM write is split into two uOps/mappings on
# this model - confirm against the bdver2 scheduling model.

vdivps  %ymm0, %ymm0, %ymm1
vaddps  %ymm0, %ymm0, %ymm2
vaddps  %ymm0, %ymm0, %ymm3
vaddps  %ymm0, %ymm0, %ymm4
vaddps  %ymm0, %ymm0, %ymm5
vaddps  %ymm0, %ymm0, %ymm6
vaddps  %ymm0, %ymm0, %ymm7
vaddps  %ymm0, %ymm0, %ymm8
vaddps  %ymm0, %ymm0, %ymm9
vaddps  %ymm0, %ymm0, %ymm10
vaddps  %ymm0, %ymm0, %ymm11
vaddps  %ymm0, %ymm0, %ymm12
vaddps  %ymm0, %ymm0, %ymm13
vaddps  %ymm0, %ymm0, %ymm14
vaddps  %ymm0, %ymm0, %ymm15
vaddps  %ymm2, %ymm0, %ymm0
vaddps  %ymm2, %ymm0, %ymm3
vaddps  %ymm2, %ymm0, %ymm4
vaddps  %ymm2, %ymm0, %ymm5
vaddps  %ymm2, %ymm0, %ymm6
vaddps  %ymm2, %ymm0, %ymm7
vaddps  %ymm2, %ymm0, %ymm8
vaddps  %ymm2, %ymm0, %ymm9
vaddps  %ymm2, %ymm0, %ymm10
vaddps  %ymm2, %ymm0, %ymm11
vaddps  %ymm2, %ymm0, %ymm12
vaddps  %ymm2, %ymm0, %ymm13
vaddps  %ymm2, %ymm0, %ymm14
vaddps  %ymm2, %ymm0, %ymm15
vaddps  %ymm3, %ymm0, %ymm2
vaddps  %ymm3, %ymm0, %ymm4
vaddps  %ymm3, %ymm0, %ymm5
vaddps  %ymm3, %ymm0, %ymm6
38 # CHECK: Iterations: 1
39 # CHECK-NEXT: Instructions: 33
40 # CHECK-NEXT: Total Cycles: 48
41 # CHECK-NEXT: Total uOps: 66
43 # CHECK: Dispatch Width: 4
44 # CHECK-NEXT: uOps Per Cycle: 1.38
45 # CHECK-NEXT: IPC: 0.69
46 # CHECK-NEXT: Block RThroughput: 41.0
48 # CHECK: Dynamic Dispatch Stall Cycles:
49 # CHECK-NEXT: RAT - Register unavailable: 0
50 # CHECK-NEXT: RCU - Retire tokens unavailable: 0
51 # CHECK-NEXT: SCHEDQ - Scheduler full: 0
52 # CHECK-NEXT: LQ - Load queue full: 0
53 # CHECK-NEXT: SQ - Store queue full: 0
54 # CHECK-NEXT: GROUP - Static restrictions on the dispatch group: 0
56 # CHECK: Dispatch Logic - number of cycles where we saw N micro opcodes dispatched:
57 # CHECK-NEXT: [# dispatched], [# cycles]
58 # CHECK-NEXT: 0, 31 (64.6%)
59 # CHECK-NEXT: 2, 1 (2.1%)
60 # CHECK-NEXT: 4, 16 (33.3%)
62 # CHECK: Register File statistics:
63 # CHECK-NEXT: Total number of mappings created: 66
64 # CHECK-NEXT: Max number of mappings used: 54
66 # CHECK: * Register File #1 -- PdFpuPRF:
67 # CHECK-NEXT: Number of physical registers: 160
68 # CHECK-NEXT: Total number of mappings created: 66
69 # CHECK-NEXT: Max number of mappings used: 54
71 # CHECK: * Register File #2 -- PdIntegerPRF:
72 # CHECK-NEXT: Number of physical registers: 96
73 # CHECK-NEXT: Total number of mappings created: 0
74 # CHECK-NEXT: Max number of mappings used: 0
76 # CHECK: Timeline view:
77 # CHECK-NEXT: 0123456789 0123456789
78 # CHECK-NEXT: Index 0123456789 0123456789 01234567
80 # CHECK: [0,0] DeeeeeeeeeER . . . . . . . . vdivps %ymm0, %ymm0, %ymm1
81 # CHECK-NEXT: [0,1] DeeeeeE----R . . . . . . . . vaddps %ymm0, %ymm0, %ymm2
82 # CHECK-NEXT: [0,2] .D=eeeeeE--R . . . . . . . . vaddps %ymm0, %ymm0, %ymm3
83 # CHECK-NEXT: [0,3] .D===eeeeeER . . . . . . . . vaddps %ymm0, %ymm0, %ymm4
84 # CHECK-NEXT: [0,4] . D====eeeeeER . . . . . . . . vaddps %ymm0, %ymm0, %ymm5
85 # CHECK-NEXT: [0,5] . D======eeeeeER . . . . . . . vaddps %ymm0, %ymm0, %ymm6
86 # CHECK-NEXT: [0,6] . D=======eeeeeER . . . . . . . vaddps %ymm0, %ymm0, %ymm7
87 # CHECK-NEXT: [0,7] . D===========eeeeeER . . . . . . vaddps %ymm0, %ymm0, %ymm8
88 # CHECK-NEXT: [0,8] . D============eeeeeER . . . . . . vaddps %ymm0, %ymm0, %ymm9
89 # CHECK-NEXT: [0,9] . D==============eeeeeER . . . . . vaddps %ymm0, %ymm0, %ymm10
90 # CHECK-NEXT: [0,10] . D==============eeeeeER . . . . . vaddps %ymm0, %ymm0, %ymm11
91 # CHECK-NEXT: [0,11] . D===============eeeeeER . . . . . vaddps %ymm0, %ymm0, %ymm12
92 # CHECK-NEXT: [0,12] . .D===============eeeeeER . . . . . vaddps %ymm0, %ymm0, %ymm13
93 # CHECK-NEXT: [0,13] . .D=================eeeeeER . . . . vaddps %ymm0, %ymm0, %ymm14
94 # CHECK-NEXT: [0,14] . . D=================eeeeeER . . . . vaddps %ymm0, %ymm0, %ymm15
95 # CHECK-NEXT: [0,15] . . D=====eeeeeE------------R . . . . vaddps %ymm2, %ymm0, %ymm0
96 # CHECK-NEXT: [0,16] . . D==============eeeeeE--R . . . . vaddps %ymm2, %ymm0, %ymm3
97 # CHECK-NEXT: [0,17] . . D=================eeeeeER . . . . vaddps %ymm2, %ymm0, %ymm4
98 # CHECK-NEXT: [0,18] . . D=================eeeeeER . . . . vaddps %ymm2, %ymm0, %ymm5
99 # CHECK-NEXT: [0,19] . . D==================eeeeeER. . . . vaddps %ymm2, %ymm0, %ymm6
100 # CHECK-NEXT: [0,20] . . D==================eeeeeER . . . vaddps %ymm2, %ymm0, %ymm7
101 # CHECK-NEXT: [0,21] . . D===================eeeeeER . . . vaddps %ymm2, %ymm0, %ymm8
102 # CHECK-NEXT: [0,22] . . .D===================eeeeeER . . . vaddps %ymm2, %ymm0, %ymm9
103 # CHECK-NEXT: [0,23] . . .D====================eeeeeER . . . vaddps %ymm2, %ymm0, %ymm10
104 # CHECK-NEXT: [0,24] . . . D====================eeeeeER. . . vaddps %ymm2, %ymm0, %ymm11
105 # CHECK-NEXT: [0,25] . . . D=====================eeeeeER . . vaddps %ymm2, %ymm0, %ymm12
106 # CHECK-NEXT: [0,26] . . . D=====================eeeeeER . . vaddps %ymm2, %ymm0, %ymm13
107 # CHECK-NEXT: [0,27] . . . D======================eeeeeER . . vaddps %ymm2, %ymm0, %ymm14
108 # CHECK-NEXT: [0,28] . . . D======================eeeeeER . . vaddps %ymm2, %ymm0, %ymm15
109 # CHECK-NEXT: [0,29] . . . D=======================eeeeeER. . vaddps %ymm3, %ymm0, %ymm2
110 # CHECK-NEXT: [0,30] . . . D=======================eeeeeER . vaddps %ymm3, %ymm0, %ymm4
111 # CHECK-NEXT: [0,31] . . . D========================eeeeeER. vaddps %ymm3, %ymm0, %ymm5
112 # CHECK-NEXT: [0,32] . . . .D========================eeeeeER vaddps %ymm3, %ymm0, %ymm6
114 # CHECK: Average Wait times (based on the timeline view):
115 # CHECK-NEXT: [0]: Executions
116 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
117 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
118 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
120 # CHECK: [0] [1] [2] [3]
121 # CHECK-NEXT: 0. 1 1.0 1.0 0.0 vdivps %ymm0, %ymm0, %ymm1
122 # CHECK-NEXT: 1. 1 1.0 1.0 4.0 vaddps %ymm0, %ymm0, %ymm2
123 # CHECK-NEXT: 2. 1 2.0 2.0 2.0 vaddps %ymm0, %ymm0, %ymm3
124 # CHECK-NEXT: 3. 1 4.0 4.0 0.0 vaddps %ymm0, %ymm0, %ymm4
125 # CHECK-NEXT: 4. 1 5.0 5.0 0.0 vaddps %ymm0, %ymm0, %ymm5
126 # CHECK-NEXT: 5. 1 7.0 7.0 0.0 vaddps %ymm0, %ymm0, %ymm6
127 # CHECK-NEXT: 6. 1 8.0 8.0 0.0 vaddps %ymm0, %ymm0, %ymm7
128 # CHECK-NEXT: 7. 1 12.0 12.0 0.0 vaddps %ymm0, %ymm0, %ymm8
129 # CHECK-NEXT: 8. 1 13.0 13.0 0.0 vaddps %ymm0, %ymm0, %ymm9
130 # CHECK-NEXT: 9. 1 15.0 15.0 0.0 vaddps %ymm0, %ymm0, %ymm10
131 # CHECK-NEXT: 10. 1 15.0 15.0 0.0 vaddps %ymm0, %ymm0, %ymm11
132 # CHECK-NEXT: 11. 1 16.0 16.0 0.0 vaddps %ymm0, %ymm0, %ymm12
133 # CHECK-NEXT: 12. 1 16.0 16.0 0.0 vaddps %ymm0, %ymm0, %ymm13
134 # CHECK-NEXT: 13. 1 18.0 18.0 0.0 vaddps %ymm0, %ymm0, %ymm14
135 # CHECK-NEXT: 14. 1 18.0 18.0 0.0 vaddps %ymm0, %ymm0, %ymm15
136 # CHECK-NEXT: 15. 1 6.0 6.0 12.0 vaddps %ymm2, %ymm0, %ymm0
137 # CHECK-NEXT: 16. 1 15.0 5.0 2.0 vaddps %ymm2, %ymm0, %ymm3
138 # CHECK-NEXT: 17. 1 18.0 8.0 0.0 vaddps %ymm2, %ymm0, %ymm4
139 # CHECK-NEXT: 18. 1 18.0 9.0 0.0 vaddps %ymm2, %ymm0, %ymm5
140 # CHECK-NEXT: 19. 1 19.0 10.0 0.0 vaddps %ymm2, %ymm0, %ymm6
141 # CHECK-NEXT: 20. 1 19.0 11.0 0.0 vaddps %ymm2, %ymm0, %ymm7
142 # CHECK-NEXT: 21. 1 20.0 12.0 0.0 vaddps %ymm2, %ymm0, %ymm8
143 # CHECK-NEXT: 22. 1 20.0 13.0 0.0 vaddps %ymm2, %ymm0, %ymm9
144 # CHECK-NEXT: 23. 1 21.0 14.0 0.0 vaddps %ymm2, %ymm0, %ymm10
145 # CHECK-NEXT: 24. 1 21.0 15.0 0.0 vaddps %ymm2, %ymm0, %ymm11
146 # CHECK-NEXT: 25. 1 22.0 16.0 0.0 vaddps %ymm2, %ymm0, %ymm12
147 # CHECK-NEXT: 26. 1 22.0 17.0 0.0 vaddps %ymm2, %ymm0, %ymm13
148 # CHECK-NEXT: 27. 1 23.0 18.0 0.0 vaddps %ymm2, %ymm0, %ymm14
149 # CHECK-NEXT: 28. 1 23.0 19.0 0.0 vaddps %ymm2, %ymm0, %ymm15
150 # CHECK-NEXT: 29. 1 24.0 10.0 0.0 vaddps %ymm3, %ymm0, %ymm2
151 # CHECK-NEXT: 30. 1 24.0 11.0 0.0 vaddps %ymm3, %ymm0, %ymm4
152 # CHECK-NEXT: 31. 1 25.0 12.0 0.0 vaddps %ymm3, %ymm0, %ymm5
153 # CHECK-NEXT: 32. 1 25.0 13.0 0.0 vaddps %ymm3, %ymm0, %ymm6