Run DCE after a LoopFlatten test to reduce spurious output [nfc]
[llvm-project.git] / llvm / test / tools / llvm-mca / X86 / Znver4 / resources-ssse3.s
blob 173c72171aafe680446dc7f780ab56dfaa0d79d5
1 # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2 # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s
#
# Purpose: feed every instruction listed below to llvm-mca using the znver4
# CPU model in instruction-tables mode, and compare the printed tables against
# the FileCheck expectations that follow the listing.
#
# The expectations are marked as autogenerated by the NOTE line above; after
# changing the instruction list or the scheduling model, regenerate them with
# that script instead of editing the tables by hand.
#
# Layout of the listing: each mnemonic is exercised in four operand forms,
# always in this order:
#   1. MMX register source   (%mm0  -> %mm2)
#   2. MMX memory source     ((%rax) -> %mm2)
#   3. XMM register source   (%xmm0 -> %xmm2)
#   4. XMM memory source     ((%rax) -> %xmm2)
# The order matters: the expected tables list instructions in the same order.
#
# Packed absolute value: byte, doubleword, word.
4 pabsb %mm0, %mm2
5 pabsb (%rax), %mm2
7 pabsb %xmm0, %xmm2
8 pabsb (%rax), %xmm2
10 pabsd %mm0, %mm2
11 pabsd (%rax), %mm2
13 pabsd %xmm0, %xmm2
14 pabsd (%rax), %xmm2
16 pabsw %mm0, %mm2
17 pabsw (%rax), %mm2
19 pabsw %xmm0, %xmm2
20 pabsw (%rax), %xmm2
# Packed align right; the only mnemonic here that also takes an immediate ($1).
22 palignr $1, %mm0, %mm2
23 palignr $1, (%rax), %mm2
25 palignr $1, %xmm0, %xmm2
26 palignr $1, (%rax), %xmm2
# Packed horizontal add: doubleword, saturating word, word.
28 phaddd %mm0, %mm2
29 phaddd (%rax), %mm2
31 phaddd %xmm0, %xmm2
32 phaddd (%rax), %xmm2
34 phaddsw %mm0, %mm2
35 phaddsw (%rax), %mm2
37 phaddsw %xmm0, %xmm2
38 phaddsw (%rax), %xmm2
40 phaddw %mm0, %mm2
41 phaddw (%rax), %mm2
43 phaddw %xmm0, %xmm2
44 phaddw (%rax), %xmm2
# Packed horizontal subtract: doubleword, saturating word, word.
46 phsubd %mm0, %mm2
47 phsubd (%rax), %mm2
49 phsubd %xmm0, %xmm2
50 phsubd (%rax), %xmm2
52 phsubsw %mm0, %mm2
53 phsubsw (%rax), %mm2
55 phsubsw %xmm0, %xmm2
56 phsubsw (%rax), %xmm2
58 phsubw %mm0, %mm2
59 phsubw (%rax), %mm2
61 phsubw %xmm0, %xmm2
62 phsubw (%rax), %xmm2
# Packed multiplies: multiply-and-add of unsigned/signed bytes, then
# multiply-high with round and scale.
64 pmaddubsw %mm0, %mm2
65 pmaddubsw (%rax), %mm2
67 pmaddubsw %xmm0, %xmm2
68 pmaddubsw (%rax), %xmm2
70 pmulhrsw %mm0, %mm2
71 pmulhrsw (%rax), %mm2
73 pmulhrsw %xmm0, %xmm2
74 pmulhrsw (%rax), %xmm2
# Packed byte shuffle.
76 pshufb %mm0, %mm2
77 pshufb (%rax), %mm2
79 pshufb %xmm0, %xmm2
80 pshufb (%rax), %xmm2
# Packed sign: byte, doubleword, word.
82 psignb %mm0, %mm2
83 psignb (%rax), %mm2
85 psignb %xmm0, %xmm2
86 psignb (%rax), %xmm2
88 psignd %mm0, %mm2
89 psignd (%rax), %mm2
91 psignd %xmm0, %xmm2
92 psignd (%rax), %xmm2
94 psignw %mm0, %mm2
95 psignw (%rax), %mm2
97 psignw %xmm0, %xmm2
98 psignw (%rax), %xmm2
100 # CHECK: Instruction Info:
101 # CHECK-NEXT: [1]: #uOps
102 # CHECK-NEXT: [2]: Latency
103 # CHECK-NEXT: [3]: RThroughput
104 # CHECK-NEXT: [4]: MayLoad
105 # CHECK-NEXT: [5]: MayStore
106 # CHECK-NEXT: [6]: HasSideEffects (U)
108 # CHECK: [1] [2] [3] [4] [5] [6] Instructions:
109 # CHECK-NEXT: 1 1 0.25 pabsb %mm0, %mm2
110 # CHECK-NEXT: 1 8 0.50 * pabsb (%rax), %mm2
111 # CHECK-NEXT: 1 2 1.00 pabsb %xmm0, %xmm2
112 # CHECK-NEXT: 1 8 0.50 * pabsb (%rax), %xmm2
113 # CHECK-NEXT: 1 1 0.25 pabsd %mm0, %mm2
114 # CHECK-NEXT: 1 8 0.50 * pabsd (%rax), %mm2
115 # CHECK-NEXT: 1 2 1.00 pabsd %xmm0, %xmm2
116 # CHECK-NEXT: 1 8 0.50 * pabsd (%rax), %xmm2
117 # CHECK-NEXT: 1 1 0.25 pabsw %mm0, %mm2
118 # CHECK-NEXT: 1 8 0.50 * pabsw (%rax), %mm2
119 # CHECK-NEXT: 1 2 1.00 pabsw %xmm0, %xmm2
120 # CHECK-NEXT: 1 8 0.50 * pabsw (%rax), %xmm2
121 # CHECK-NEXT: 1 1 0.50 palignr $1, %mm0, %mm2
122 # CHECK-NEXT: 1 8 0.50 * palignr $1, (%rax), %mm2
123 # CHECK-NEXT: 1 2 1.00 palignr $1, %xmm0, %xmm2
124 # CHECK-NEXT: 1 8 0.50 * palignr $1, (%rax), %xmm2
125 # CHECK-NEXT: 3 2 2.00 phaddd %mm0, %mm2
126 # CHECK-NEXT: 4 9 2.00 * phaddd (%rax), %mm2
127 # CHECK-NEXT: 3 2 2.00 phaddd %xmm0, %xmm2
128 # CHECK-NEXT: 3 9 2.00 * phaddd (%rax), %xmm2
129 # CHECK-NEXT: 3 2 2.00 phaddsw %mm0, %mm2
130 # CHECK-NEXT: 4 9 2.00 * phaddsw (%rax), %mm2
131 # CHECK-NEXT: 3 2 2.00 phaddsw %xmm0, %xmm2
132 # CHECK-NEXT: 3 9 2.00 * phaddsw (%rax), %xmm2
133 # CHECK-NEXT: 3 2 2.00 phaddw %mm0, %mm2
134 # CHECK-NEXT: 4 9 2.00 * phaddw (%rax), %mm2
135 # CHECK-NEXT: 3 2 2.00 phaddw %xmm0, %xmm2
136 # CHECK-NEXT: 3 9 2.00 * phaddw (%rax), %xmm2
137 # CHECK-NEXT: 3 2 2.00 phsubd %mm0, %mm2
138 # CHECK-NEXT: 4 9 2.00 * phsubd (%rax), %mm2
139 # CHECK-NEXT: 3 2 2.00 phsubd %xmm0, %xmm2
140 # CHECK-NEXT: 3 9 2.00 * phsubd (%rax), %xmm2
141 # CHECK-NEXT: 3 2 2.00 phsubsw %mm0, %mm2
142 # CHECK-NEXT: 4 9 2.00 * phsubsw (%rax), %mm2
143 # CHECK-NEXT: 3 2 2.00 phsubsw %xmm0, %xmm2
144 # CHECK-NEXT: 3 9 2.00 * phsubsw (%rax), %xmm2
145 # CHECK-NEXT: 3 2 2.00 phsubw %mm0, %mm2
146 # CHECK-NEXT: 4 9 2.00 * phsubw (%rax), %mm2
147 # CHECK-NEXT: 3 2 2.00 phsubw %xmm0, %xmm2
148 # CHECK-NEXT: 3 9 2.00 * phsubw (%rax), %xmm2
149 # CHECK-NEXT: 1 3 0.50 pmaddubsw %mm0, %mm2
150 # CHECK-NEXT: 1 10 0.50 * pmaddubsw (%rax), %mm2
151 # CHECK-NEXT: 1 3 0.50 pmaddubsw %xmm0, %xmm2
152 # CHECK-NEXT: 1 10 0.50 * pmaddubsw (%rax), %xmm2
153 # CHECK-NEXT: 1 3 0.50 pmulhrsw %mm0, %mm2
154 # CHECK-NEXT: 1 10 0.50 * pmulhrsw (%rax), %mm2
155 # CHECK-NEXT: 1 3 0.50 pmulhrsw %xmm0, %xmm2
156 # CHECK-NEXT: 1 10 0.50 * pmulhrsw (%rax), %xmm2
157 # CHECK-NEXT: 1 1 0.50 pshufb %mm0, %mm2
158 # CHECK-NEXT: 1 8 0.50 * pshufb (%rax), %mm2
159 # CHECK-NEXT: 1 1 0.50 pshufb %xmm0, %xmm2
160 # CHECK-NEXT: 1 8 0.50 * pshufb (%rax), %xmm2
161 # CHECK-NEXT: 1 1 0.25 psignb %mm0, %mm2
162 # CHECK-NEXT: 1 8 0.50 * psignb (%rax), %mm2
163 # CHECK-NEXT: 1 2 1.00 psignb %xmm0, %xmm2
164 # CHECK-NEXT: 1 8 0.50 * psignb (%rax), %xmm2
165 # CHECK-NEXT: 1 1 0.25 psignd %mm0, %mm2
166 # CHECK-NEXT: 1 8 0.50 * psignd (%rax), %mm2
167 # CHECK-NEXT: 1 2 1.00 psignd %xmm0, %xmm2
168 # CHECK-NEXT: 1 8 0.50 * psignd (%rax), %xmm2
169 # CHECK-NEXT: 1 1 0.25 psignw %mm0, %mm2
170 # CHECK-NEXT: 1 8 0.50 * psignw (%rax), %mm2
171 # CHECK-NEXT: 1 2 1.00 psignw %xmm0, %xmm2
172 # CHECK-NEXT: 1 8 0.50 * psignw (%rax), %xmm2
174 # CHECK: Resources:
175 # CHECK-NEXT: [0] - Zn4AGU0
176 # CHECK-NEXT: [1] - Zn4AGU1
177 # CHECK-NEXT: [2] - Zn4AGU2
178 # CHECK-NEXT: [3] - Zn4ALU0
179 # CHECK-NEXT: [4] - Zn4ALU1
180 # CHECK-NEXT: [5] - Zn4ALU2
181 # CHECK-NEXT: [6] - Zn4ALU3
182 # CHECK-NEXT: [7] - Zn4BRU1
183 # CHECK-NEXT: [8] - Zn4FP0
184 # CHECK-NEXT: [9] - Zn4FP1
185 # CHECK-NEXT: [10] - Zn4FP2
186 # CHECK-NEXT: [11] - Zn4FP3
187 # CHECK-NEXT: [12.0] - Zn4FP45
188 # CHECK-NEXT: [12.1] - Zn4FP45
189 # CHECK-NEXT: [13] - Zn4FPSt
190 # CHECK-NEXT: [14.0] - Zn4LSU
191 # CHECK-NEXT: [14.1] - Zn4LSU
192 # CHECK-NEXT: [14.2] - Zn4LSU
193 # CHECK-NEXT: [15.0] - Zn4Load
194 # CHECK-NEXT: [15.1] - Zn4Load
195 # CHECK-NEXT: [15.2] - Zn4Load
196 # CHECK-NEXT: [16.0] - Zn4Store
197 # CHECK-NEXT: [16.1] - Zn4Store
199 # CHECK: Resource pressure per iteration:
200 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
201 # CHECK-NEXT: - - - - - - - - 62.50 15.00 9.00 8.50 16.00 16.00 - 10.67 10.67 10.67 10.67 10.67 10.67 - -
203 # CHECK: Resource pressure by instruction:
204 # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
205 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pabsb %mm0, %mm2
206 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsb (%rax), %mm2
207 # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - pabsb %xmm0, %xmm2
208 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsb (%rax), %xmm2
209 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pabsd %mm0, %mm2
210 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsd (%rax), %mm2
211 # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - pabsd %xmm0, %xmm2
212 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsd (%rax), %xmm2
213 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pabsw %mm0, %mm2
214 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsw (%rax), %mm2
215 # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - pabsw %xmm0, %xmm2
216 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsw (%rax), %xmm2
217 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - palignr $1, %mm0, %mm2
218 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - palignr $1, (%rax), %mm2
219 # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - palignr $1, %xmm0, %xmm2
220 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - palignr $1, (%rax), %xmm2
221 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddd %mm0, %mm2
222 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddd (%rax), %mm2
223 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddd %xmm0, %xmm2
224 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddd (%rax), %xmm2
225 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddsw %mm0, %mm2
226 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddsw (%rax), %mm2
227 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddsw %xmm0, %xmm2
228 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddsw (%rax), %xmm2
229 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddw %mm0, %mm2
230 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddw (%rax), %mm2
231 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddw %xmm0, %xmm2
232 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddw (%rax), %xmm2
233 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubd %mm0, %mm2
234 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubd (%rax), %mm2
235 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubd %xmm0, %xmm2
236 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubd (%rax), %xmm2
237 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubsw %mm0, %mm2
238 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubsw (%rax), %mm2
239 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubsw %xmm0, %xmm2
240 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubsw (%rax), %xmm2
241 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubw %mm0, %mm2
242 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubw (%rax), %mm2
243 # CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubw %xmm0, %xmm2
244 # CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubw (%rax), %xmm2
245 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddubsw %mm0, %mm2
246 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddubsw (%rax), %mm2
247 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddubsw %xmm0, %xmm2
248 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddubsw (%rax), %xmm2
249 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhrsw %mm0, %mm2
250 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhrsw (%rax), %mm2
251 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhrsw %xmm0, %xmm2
252 # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhrsw (%rax), %xmm2
253 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufb %mm0, %mm2
254 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufb (%rax), %mm2
255 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufb %xmm0, %xmm2
256 # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufb (%rax), %xmm2
257 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psignb %mm0, %mm2
258 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignb (%rax), %mm2
259 # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - psignb %xmm0, %xmm2
260 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignb (%rax), %xmm2
261 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psignd %mm0, %mm2
262 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignd (%rax), %mm2
263 # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - psignd %xmm0, %xmm2
264 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignd (%rax), %xmm2
265 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psignw %mm0, %mm2
266 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignw (%rax), %mm2
267 # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - psignw %xmm0, %xmm2
268 # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignw (%rax), %xmm2