Run DCE after a LoopFlatten test to reduce spurious output [nfc]
[llvm-project.git] / llvm / test / CodeGen / PowerPC / test-vector-insert.ll
blob087f2244f0f7d064b59d0daa0976a23889d65ae1
1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
3 ; RUN:  -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
4 ; RUN:  -mcpu=pwr7 < %s | FileCheck %s --check-prefix=CHECK-LE-P7
5 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
6 ; RUN:  -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
7 ; RUN:  -mcpu=pwr8 < %s | FileCheck %s --check-prefix=CHECK-LE-P8
8 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
9 ; RUN:  -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
10 ; RUN:  -mcpu=pwr9 < %s | FileCheck %s --check-prefix=CHECK-LE-P9
11 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu \
12 ; RUN:  -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
13 ; RUN:  -mcpu=pwr7 < %s | FileCheck %s --check-prefix=CHECK-BE-P7
14 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu \
15 ; RUN:  -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
16 ; RUN:  -mcpu=pwr8 < %s | FileCheck %s --check-prefix=CHECK-BE-P8
17 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu \
18 ; RUN:  -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
19 ; RUN:  -mcpu=pwr9 < %s | FileCheck %s --check-prefix=CHECK-BE-P9
20 ; xscvdpsxws and xscvdpsxws is only available on Power7 and above
21 ; Codgen is different for Power7, Power8, and Power9.
23 define dso_local <4 x i32> @test(<4 x i32> %a, double %b) {
24 ; CHECK-LE-P7-LABEL: test:
25 ; CHECK-LE-P7:       # %bb.0: # %entry
26 ; CHECK-LE-P7-NEXT:    xscvdpsxws f0, f1
27 ; CHECK-LE-P7-NEXT:    addi r3, r1, -4
28 ; CHECK-LE-P7-NEXT:    stfiwx f0, 0, r3
29 ; CHECK-LE-P7-NEXT:    lwz r3, -4(r1)
30 ; CHECK-LE-P7-NEXT:    stw r3, -32(r1)
31 ; CHECK-LE-P7-NEXT:    addis r3, r2, .LCPI0_0@toc@ha
32 ; CHECK-LE-P7-NEXT:    addi r3, r3, .LCPI0_0@toc@l
33 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
34 ; CHECK-LE-P7-NEXT:    addi r3, r1, -32
35 ; CHECK-LE-P7-NEXT:    xxswapd v3, vs0
36 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
37 ; CHECK-LE-P7-NEXT:    xxswapd v4, vs0
38 ; CHECK-LE-P7-NEXT:    vperm v2, v4, v2, v3
39 ; CHECK-LE-P7-NEXT:    blr
41 ; CHECK-LE-P8-LABEL: test:
42 ; CHECK-LE-P8:       # %bb.0: # %entry
43 ; CHECK-LE-P8-NEXT:    addis r3, r2, .LCPI0_0@toc@ha
44 ; CHECK-LE-P8-NEXT:    xscvdpsxws v4, f1
45 ; CHECK-LE-P8-NEXT:    addi r3, r3, .LCPI0_0@toc@l
46 ; CHECK-LE-P8-NEXT:    lxvd2x vs0, 0, r3
47 ; CHECK-LE-P8-NEXT:    xxswapd v3, vs0
48 ; CHECK-LE-P8-NEXT:    vperm v2, v4, v2, v3
49 ; CHECK-LE-P8-NEXT:    blr
51 ; CHECK-LE-P9-LABEL: test:
52 ; CHECK-LE-P9:       # %bb.0: # %entry
53 ; CHECK-LE-P9-NEXT:    xscvdpsxws f0, f1
54 ; CHECK-LE-P9-NEXT:    xxinsertw v2, vs0, 0
55 ; CHECK-LE-P9-NEXT:    blr
57 ; CHECK-BE-P7-LABEL: test:
58 ; CHECK-BE-P7:       # %bb.0: # %entry
59 ; CHECK-BE-P7-NEXT:    xscvdpsxws f0, f1
60 ; CHECK-BE-P7-NEXT:    addi r3, r1, -4
61 ; CHECK-BE-P7-NEXT:    stfiwx f0, 0, r3
62 ; CHECK-BE-P7-NEXT:    lwz r3, -4(r1)
63 ; CHECK-BE-P7-NEXT:    stw r3, -32(r1)
64 ; CHECK-BE-P7-NEXT:    addis r3, r2, .LCPI0_0@toc@ha
65 ; CHECK-BE-P7-NEXT:    addi r3, r3, .LCPI0_0@toc@l
66 ; CHECK-BE-P7-NEXT:    lxvw4x v3, 0, r3
67 ; CHECK-BE-P7-NEXT:    addi r3, r1, -32
68 ; CHECK-BE-P7-NEXT:    lxvw4x v4, 0, r3
69 ; CHECK-BE-P7-NEXT:    vperm v2, v2, v4, v3
70 ; CHECK-BE-P7-NEXT:    blr
72 ; CHECK-BE-P8-LABEL: test:
73 ; CHECK-BE-P8:       # %bb.0: # %entry
74 ; CHECK-BE-P8-NEXT:    addis r3, r2, .LCPI0_0@toc@ha
75 ; CHECK-BE-P8-NEXT:    xscvdpsxws v4, f1
76 ; CHECK-BE-P8-NEXT:    addi r3, r3, .LCPI0_0@toc@l
77 ; CHECK-BE-P8-NEXT:    lxvw4x v3, 0, r3
78 ; CHECK-BE-P8-NEXT:    vperm v2, v2, v4, v3
79 ; CHECK-BE-P8-NEXT:    blr
81 ; CHECK-BE-P9-LABEL: test:
82 ; CHECK-BE-P9:       # %bb.0: # %entry
83 ; CHECK-BE-P9-NEXT:    xscvdpsxws f0, f1
84 ; CHECK-BE-P9-NEXT:    xxinsertw v2, vs0, 12
85 ; CHECK-BE-P9-NEXT:    blr
86 entry:
87   %conv = fptosi double %b to i32
88   %vecins = insertelement <4 x i32> %a, i32 %conv, i32 3
89   ret <4 x i32> %vecins
92 define dso_local <4 x i32> @test2(<4 x i32> %a, float %b) {
93 ; CHECK-LE-P7-LABEL: test2:
94 ; CHECK-LE-P7:       # %bb.0: # %entry
95 ; CHECK-LE-P7-NEXT:    xscvdpsxws f0, f1
96 ; CHECK-LE-P7-NEXT:    addi r3, r1, -4
97 ; CHECK-LE-P7-NEXT:    stfiwx f0, 0, r3
98 ; CHECK-LE-P7-NEXT:    lwz r3, -4(r1)
99 ; CHECK-LE-P7-NEXT:    stw r3, -32(r1)
100 ; CHECK-LE-P7-NEXT:    addis r3, r2, .LCPI1_0@toc@ha
101 ; CHECK-LE-P7-NEXT:    addi r3, r3, .LCPI1_0@toc@l
102 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
103 ; CHECK-LE-P7-NEXT:    addi r3, r1, -32
104 ; CHECK-LE-P7-NEXT:    xxswapd v3, vs0
105 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
106 ; CHECK-LE-P7-NEXT:    xxswapd v4, vs0
107 ; CHECK-LE-P7-NEXT:    vperm v2, v4, v2, v3
108 ; CHECK-LE-P7-NEXT:    blr
110 ; CHECK-LE-P8-LABEL: test2:
111 ; CHECK-LE-P8:       # %bb.0: # %entry
112 ; CHECK-LE-P8-NEXT:    addis r3, r2, .LCPI1_0@toc@ha
113 ; CHECK-LE-P8-NEXT:    xscvdpsxws v4, f1
114 ; CHECK-LE-P8-NEXT:    addi r3, r3, .LCPI1_0@toc@l
115 ; CHECK-LE-P8-NEXT:    lxvd2x vs0, 0, r3
116 ; CHECK-LE-P8-NEXT:    xxswapd v3, vs0
117 ; CHECK-LE-P8-NEXT:    vperm v2, v4, v2, v3
118 ; CHECK-LE-P8-NEXT:    blr
120 ; CHECK-LE-P9-LABEL: test2:
121 ; CHECK-LE-P9:       # %bb.0: # %entry
122 ; CHECK-LE-P9-NEXT:    xscvdpsxws f0, f1
123 ; CHECK-LE-P9-NEXT:    xxinsertw v2, vs0, 0
124 ; CHECK-LE-P9-NEXT:    blr
126 ; CHECK-BE-P7-LABEL: test2:
127 ; CHECK-BE-P7:       # %bb.0: # %entry
128 ; CHECK-BE-P7-NEXT:    xscvdpsxws f0, f1
129 ; CHECK-BE-P7-NEXT:    addi r3, r1, -4
130 ; CHECK-BE-P7-NEXT:    stfiwx f0, 0, r3
131 ; CHECK-BE-P7-NEXT:    lwz r3, -4(r1)
132 ; CHECK-BE-P7-NEXT:    stw r3, -32(r1)
133 ; CHECK-BE-P7-NEXT:    addis r3, r2, .LCPI1_0@toc@ha
134 ; CHECK-BE-P7-NEXT:    addi r3, r3, .LCPI1_0@toc@l
135 ; CHECK-BE-P7-NEXT:    lxvw4x v3, 0, r3
136 ; CHECK-BE-P7-NEXT:    addi r3, r1, -32
137 ; CHECK-BE-P7-NEXT:    lxvw4x v4, 0, r3
138 ; CHECK-BE-P7-NEXT:    vperm v2, v2, v4, v3
139 ; CHECK-BE-P7-NEXT:    blr
141 ; CHECK-BE-P8-LABEL: test2:
142 ; CHECK-BE-P8:       # %bb.0: # %entry
143 ; CHECK-BE-P8-NEXT:    addis r3, r2, .LCPI1_0@toc@ha
144 ; CHECK-BE-P8-NEXT:    xscvdpsxws v4, f1
145 ; CHECK-BE-P8-NEXT:    addi r3, r3, .LCPI1_0@toc@l
146 ; CHECK-BE-P8-NEXT:    lxvw4x v3, 0, r3
147 ; CHECK-BE-P8-NEXT:    vperm v2, v2, v4, v3
148 ; CHECK-BE-P8-NEXT:    blr
150 ; CHECK-BE-P9-LABEL: test2:
151 ; CHECK-BE-P9:       # %bb.0: # %entry
152 ; CHECK-BE-P9-NEXT:    xscvdpsxws f0, f1
153 ; CHECK-BE-P9-NEXT:    xxinsertw v2, vs0, 12
154 ; CHECK-BE-P9-NEXT:    blr
155 entry:
156   %conv = fptosi float %b to i32
157   %vecins = insertelement <4 x i32> %a, i32 %conv, i32 3
158   ret <4 x i32> %vecins
161 define dso_local <4 x i32> @test3(<4 x i32> %a, double %b) {
162 ; CHECK-LE-P7-LABEL: test3:
163 ; CHECK-LE-P7:       # %bb.0: # %entry
164 ; CHECK-LE-P7-NEXT:    xscvdpuxws f0, f1
165 ; CHECK-LE-P7-NEXT:    addi r3, r1, -4
166 ; CHECK-LE-P7-NEXT:    stfiwx f0, 0, r3
167 ; CHECK-LE-P7-NEXT:    lwz r3, -4(r1)
168 ; CHECK-LE-P7-NEXT:    stw r3, -32(r1)
169 ; CHECK-LE-P7-NEXT:    addis r3, r2, .LCPI2_0@toc@ha
170 ; CHECK-LE-P7-NEXT:    addi r3, r3, .LCPI2_0@toc@l
171 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
172 ; CHECK-LE-P7-NEXT:    addi r3, r1, -32
173 ; CHECK-LE-P7-NEXT:    xxswapd v3, vs0
174 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
175 ; CHECK-LE-P7-NEXT:    xxswapd v4, vs0
176 ; CHECK-LE-P7-NEXT:    vperm v2, v4, v2, v3
177 ; CHECK-LE-P7-NEXT:    blr
179 ; CHECK-LE-P8-LABEL: test3:
180 ; CHECK-LE-P8:       # %bb.0: # %entry
181 ; CHECK-LE-P8-NEXT:    addis r3, r2, .LCPI2_0@toc@ha
182 ; CHECK-LE-P8-NEXT:    xscvdpuxws v4, f1
183 ; CHECK-LE-P8-NEXT:    addi r3, r3, .LCPI2_0@toc@l
184 ; CHECK-LE-P8-NEXT:    lxvd2x vs0, 0, r3
185 ; CHECK-LE-P8-NEXT:    xxswapd v3, vs0
186 ; CHECK-LE-P8-NEXT:    vperm v2, v4, v2, v3
187 ; CHECK-LE-P8-NEXT:    blr
189 ; CHECK-LE-P9-LABEL: test3:
190 ; CHECK-LE-P9:       # %bb.0: # %entry
191 ; CHECK-LE-P9-NEXT:    xscvdpuxws f0, f1
192 ; CHECK-LE-P9-NEXT:    xxinsertw v2, vs0, 0
193 ; CHECK-LE-P9-NEXT:    blr
195 ; CHECK-BE-P7-LABEL: test3:
196 ; CHECK-BE-P7:       # %bb.0: # %entry
197 ; CHECK-BE-P7-NEXT:    xscvdpuxws f0, f1
198 ; CHECK-BE-P7-NEXT:    addi r3, r1, -4
199 ; CHECK-BE-P7-NEXT:    stfiwx f0, 0, r3
200 ; CHECK-BE-P7-NEXT:    lwz r3, -4(r1)
201 ; CHECK-BE-P7-NEXT:    stw r3, -32(r1)
202 ; CHECK-BE-P7-NEXT:    addis r3, r2, .LCPI2_0@toc@ha
203 ; CHECK-BE-P7-NEXT:    addi r3, r3, .LCPI2_0@toc@l
204 ; CHECK-BE-P7-NEXT:    lxvw4x v3, 0, r3
205 ; CHECK-BE-P7-NEXT:    addi r3, r1, -32
206 ; CHECK-BE-P7-NEXT:    lxvw4x v4, 0, r3
207 ; CHECK-BE-P7-NEXT:    vperm v2, v2, v4, v3
208 ; CHECK-BE-P7-NEXT:    blr
210 ; CHECK-BE-P8-LABEL: test3:
211 ; CHECK-BE-P8:       # %bb.0: # %entry
212 ; CHECK-BE-P8-NEXT:    addis r3, r2, .LCPI2_0@toc@ha
213 ; CHECK-BE-P8-NEXT:    xscvdpuxws v4, f1
214 ; CHECK-BE-P8-NEXT:    addi r3, r3, .LCPI2_0@toc@l
215 ; CHECK-BE-P8-NEXT:    lxvw4x v3, 0, r3
216 ; CHECK-BE-P8-NEXT:    vperm v2, v2, v4, v3
217 ; CHECK-BE-P8-NEXT:    blr
219 ; CHECK-BE-P9-LABEL: test3:
220 ; CHECK-BE-P9:       # %bb.0: # %entry
221 ; CHECK-BE-P9-NEXT:    xscvdpuxws f0, f1
222 ; CHECK-BE-P9-NEXT:    xxinsertw v2, vs0, 12
223 ; CHECK-BE-P9-NEXT:    blr
224 entry:
225   %conv = fptoui double %b to i32
226   %vecins = insertelement <4 x i32> %a, i32 %conv, i32 3
227   ret <4 x i32> %vecins
230 define dso_local <4 x i32> @test4(<4 x i32> %a, float %b) {
231 ; CHECK-LE-P7-LABEL: test4:
232 ; CHECK-LE-P7:       # %bb.0: # %entry
233 ; CHECK-LE-P7-NEXT:    xscvdpuxws f0, f1
234 ; CHECK-LE-P7-NEXT:    addi r3, r1, -4
235 ; CHECK-LE-P7-NEXT:    stfiwx f0, 0, r3
236 ; CHECK-LE-P7-NEXT:    lwz r3, -4(r1)
237 ; CHECK-LE-P7-NEXT:    stw r3, -32(r1)
238 ; CHECK-LE-P7-NEXT:    addis r3, r2, .LCPI3_0@toc@ha
239 ; CHECK-LE-P7-NEXT:    addi r3, r3, .LCPI3_0@toc@l
240 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
241 ; CHECK-LE-P7-NEXT:    addi r3, r1, -32
242 ; CHECK-LE-P7-NEXT:    xxswapd v3, vs0
243 ; CHECK-LE-P7-NEXT:    lxvd2x vs0, 0, r3
244 ; CHECK-LE-P7-NEXT:    xxswapd v4, vs0
245 ; CHECK-LE-P7-NEXT:    vperm v2, v4, v2, v3
246 ; CHECK-LE-P7-NEXT:    blr
248 ; CHECK-LE-P8-LABEL: test4:
249 ; CHECK-LE-P8:       # %bb.0: # %entry
250 ; CHECK-LE-P8-NEXT:    addis r3, r2, .LCPI3_0@toc@ha
251 ; CHECK-LE-P8-NEXT:    xscvdpuxws v4, f1
252 ; CHECK-LE-P8-NEXT:    addi r3, r3, .LCPI3_0@toc@l
253 ; CHECK-LE-P8-NEXT:    lxvd2x vs0, 0, r3
254 ; CHECK-LE-P8-NEXT:    xxswapd v3, vs0
255 ; CHECK-LE-P8-NEXT:    vperm v2, v4, v2, v3
256 ; CHECK-LE-P8-NEXT:    blr
258 ; CHECK-LE-P9-LABEL: test4:
259 ; CHECK-LE-P9:       # %bb.0: # %entry
260 ; CHECK-LE-P9-NEXT:    xscvdpuxws f0, f1
261 ; CHECK-LE-P9-NEXT:    xxinsertw v2, vs0, 0
262 ; CHECK-LE-P9-NEXT:    blr
264 ; CHECK-BE-P7-LABEL: test4:
265 ; CHECK-BE-P7:       # %bb.0: # %entry
266 ; CHECK-BE-P7-NEXT:    xscvdpuxws f0, f1
267 ; CHECK-BE-P7-NEXT:    addi r3, r1, -4
268 ; CHECK-BE-P7-NEXT:    stfiwx f0, 0, r3
269 ; CHECK-BE-P7-NEXT:    lwz r3, -4(r1)
270 ; CHECK-BE-P7-NEXT:    stw r3, -32(r1)
271 ; CHECK-BE-P7-NEXT:    addis r3, r2, .LCPI3_0@toc@ha
272 ; CHECK-BE-P7-NEXT:    addi r3, r3, .LCPI3_0@toc@l
273 ; CHECK-BE-P7-NEXT:    lxvw4x v3, 0, r3
274 ; CHECK-BE-P7-NEXT:    addi r3, r1, -32
275 ; CHECK-BE-P7-NEXT:    lxvw4x v4, 0, r3
276 ; CHECK-BE-P7-NEXT:    vperm v2, v2, v4, v3
277 ; CHECK-BE-P7-NEXT:    blr
279 ; CHECK-BE-P8-LABEL: test4:
280 ; CHECK-BE-P8:       # %bb.0: # %entry
281 ; CHECK-BE-P8-NEXT:    addis r3, r2, .LCPI3_0@toc@ha
282 ; CHECK-BE-P8-NEXT:    xscvdpuxws v4, f1
283 ; CHECK-BE-P8-NEXT:    addi r3, r3, .LCPI3_0@toc@l
284 ; CHECK-BE-P8-NEXT:    lxvw4x v3, 0, r3
285 ; CHECK-BE-P8-NEXT:    vperm v2, v2, v4, v3
286 ; CHECK-BE-P8-NEXT:    blr
288 ; CHECK-BE-P9-LABEL: test4:
289 ; CHECK-BE-P9:       # %bb.0: # %entry
290 ; CHECK-BE-P9-NEXT:    xscvdpuxws f0, f1
291 ; CHECK-BE-P9-NEXT:    xxinsertw v2, vs0, 12
292 ; CHECK-BE-P9-NEXT:    blr
293 entry:
294   %conv = fptoui float %b to i32
295   %vecins = insertelement <4 x i32> %a, i32 %conv, i32 3
296   ret <4 x i32> %vecins