1 # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2 # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -timeline -iterations=2 < %s | FileCheck %s
4 # PR51494: A read-advance on the implicit read of EDX/RDX was missing.
# Each MULX form below sits in its own analysis region, so the tool emits one
# report per form: region [0] for the 32-bit variant and region [1] for the
# 64-bit variant. Every statement is kept on a single line because a newline
# terminates a statement in AT&T syntax.

# 32-bit form; implicitly reads EDX.
# LLVM-MCA-BEGIN
mulxl (%rdi), %eax, %edx
# LLVM-MCA-END

# 64-bit form; implicitly reads RDX.
# LLVM-MCA-BEGIN
mulxq (%rdi), %rax, %rdx
# LLVM-MCA-END
14 # CHECK: [0] Code Region
16 # CHECK: Iterations: 2
17 # CHECK-NEXT: Instructions: 2
18 # CHECK-NEXT: Total Cycles: 15
19 # CHECK-NEXT: Total uOps: 4
21 # CHECK: Dispatch Width: 6
22 # CHECK-NEXT: uOps Per Cycle: 0.27
23 # CHECK-NEXT: IPC: 0.13
24 # CHECK-NEXT: Block RThroughput: 1.0
26 # CHECK: Instruction Info:
27 # CHECK-NEXT: [1]: #uOps
28 # CHECK-NEXT: [2]: Latency
29 # CHECK-NEXT: [3]: RThroughput
30 # CHECK-NEXT: [4]: MayLoad
31 # CHECK-NEXT: [5]: MayStore
32 # CHECK-NEXT: [6]: HasSideEffects (U)
34 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
35 # CHECK-NEXT: 2 8 1.00 * mulxl (%rdi), %eax, %edx
# CHECK: Resources:
# CHECK-NEXT: [0] - Zn3AGU0
39 # CHECK-NEXT: [1] - Zn3AGU1
40 # CHECK-NEXT: [2] - Zn3AGU2
41 # CHECK-NEXT: [3] - Zn3ALU0
42 # CHECK-NEXT: [4] - Zn3ALU1
43 # CHECK-NEXT: [5] - Zn3ALU2
44 # CHECK-NEXT: [6] - Zn3ALU3
45 # CHECK-NEXT: [7] - Zn3BRU1
46 # CHECK-NEXT: [8] - Zn3FPP0
47 # CHECK-NEXT: [9] - Zn3FPP1
48 # CHECK-NEXT: [10] - Zn3FPP2
49 # CHECK-NEXT: [11] - Zn3FPP3
50 # CHECK-NEXT: [12.0] - Zn3FPP45
51 # CHECK-NEXT: [12.1] - Zn3FPP45
52 # CHECK-NEXT: [13] - Zn3FPSt
53 # CHECK-NEXT: [14.0] - Zn3LSU
54 # CHECK-NEXT: [14.1] - Zn3LSU
55 # CHECK-NEXT: [14.2] - Zn3LSU
56 # CHECK-NEXT: [15.0] - Zn3Load
57 # CHECK-NEXT: [15.1] - Zn3Load
58 # CHECK-NEXT: [15.2] - Zn3Load
59 # CHECK-NEXT: [16.0] - Zn3Store
60 # CHECK-NEXT: [16.1] - Zn3Store
62 # CHECK: Resource pressure per iteration:
63 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
64 # CHECK-NEXT: - 0.50 0.50 - 1.00 - - - - - - - - - - - 0.50 0.50 - 0.50 0.50 - -
66 # CHECK: Resource pressure by instruction:
67 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
68 # CHECK-NEXT: - 0.50 0.50 - 1.00 - - - - - - - - - - - 0.50 0.50 - 0.50 0.50 - - mulxl (%rdi), %eax, %edx
70 # CHECK: Timeline view:
# CHECK-NEXT: 01234
# CHECK-NEXT: Index 0123456789
74 # CHECK: [0,0] DeeeeeeeeER . mulxl (%rdi), %eax, %edx
75 # CHECK-NEXT: [1,0] D====eeeeeeeeER mulxl (%rdi), %eax, %edx
77 # CHECK: Average Wait times (based on the timeline view):
78 # CHECK-NEXT: [0]: Executions
79 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
80 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
81 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
83 # CHECK: [0] [1] [2] [3]
84 # CHECK-NEXT: 0. 2 3.0 0.5 0.0 mulxl (%rdi), %eax, %edx
86 # CHECK: [1] Code Region
88 # CHECK: Iterations: 2
89 # CHECK-NEXT: Instructions: 2
90 # CHECK-NEXT: Total Cycles: 15
91 # CHECK-NEXT: Total uOps: 4
93 # CHECK: Dispatch Width: 6
94 # CHECK-NEXT: uOps Per Cycle: 0.27
95 # CHECK-NEXT: IPC: 0.13
96 # CHECK-NEXT: Block RThroughput: 1.0
98 # CHECK: Instruction Info:
99 # CHECK-NEXT: [1]: #uOps
100 # CHECK-NEXT: [2]: Latency
101 # CHECK-NEXT: [3]: RThroughput
102 # CHECK-NEXT: [4]: MayLoad
103 # CHECK-NEXT: [5]: MayStore
104 # CHECK-NEXT: [6]: HasSideEffects (U)
106 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
107 # CHECK-NEXT: 2 8 1.00 * mulxq (%rdi), %rax, %rdx
# CHECK: Resources:
# CHECK-NEXT: [0] - Zn3AGU0
111 # CHECK-NEXT: [1] - Zn3AGU1
112 # CHECK-NEXT: [2] - Zn3AGU2
113 # CHECK-NEXT: [3] - Zn3ALU0
114 # CHECK-NEXT: [4] - Zn3ALU1
115 # CHECK-NEXT: [5] - Zn3ALU2
116 # CHECK-NEXT: [6] - Zn3ALU3
117 # CHECK-NEXT: [7] - Zn3BRU1
118 # CHECK-NEXT: [8] - Zn3FPP0
119 # CHECK-NEXT: [9] - Zn3FPP1
120 # CHECK-NEXT: [10] - Zn3FPP2
121 # CHECK-NEXT: [11] - Zn3FPP3
122 # CHECK-NEXT: [12.0] - Zn3FPP45
123 # CHECK-NEXT: [12.1] - Zn3FPP45
124 # CHECK-NEXT: [13] - Zn3FPSt
125 # CHECK-NEXT: [14.0] - Zn3LSU
126 # CHECK-NEXT: [14.1] - Zn3LSU
127 # CHECK-NEXT: [14.2] - Zn3LSU
128 # CHECK-NEXT: [15.0] - Zn3Load
129 # CHECK-NEXT: [15.1] - Zn3Load
130 # CHECK-NEXT: [15.2] - Zn3Load
131 # CHECK-NEXT: [16.0] - Zn3Store
132 # CHECK-NEXT: [16.1] - Zn3Store
134 # CHECK: Resource pressure per iteration:
135 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
136 # CHECK-NEXT: - 0.50 0.50 - 1.00 - - - - - - - - - - - 0.50 0.50 - 0.50 0.50 - -
138 # CHECK: Resource pressure by instruction:
139 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
140 # CHECK-NEXT: - 0.50 0.50 - 1.00 - - - - - - - - - - - 0.50 0.50 - 0.50 0.50 - - mulxq (%rdi), %rax, %rdx
142 # CHECK: Timeline view:
# CHECK-NEXT: 01234
# CHECK-NEXT: Index 0123456789
146 # CHECK: [0,0] DeeeeeeeeER . mulxq (%rdi), %rax, %rdx
147 # CHECK-NEXT: [1,0] D====eeeeeeeeER mulxq (%rdi), %rax, %rdx
149 # CHECK: Average Wait times (based on the timeline view):
150 # CHECK-NEXT: [0]: Executions
151 # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
152 # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
153 # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
155 # CHECK: [0] [1] [2] [3]
156 # CHECK-NEXT: 0. 2 3.0 0.5 0.0 mulxq (%rdi), %rax, %rdx