1 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu -mcpu=pwr8 < %s | FileCheck %s
2 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr8 < %s | FileCheck %s
4 @vda = common global <2 x double> zeroinitializer, align 16
5 @vdb = common global <2 x double> zeroinitializer, align 16
6 @vdr = common global <2 x double> zeroinitializer, align 16
7 @vfa = common global <4 x float> zeroinitializer, align 16
8 @vfb = common global <4 x float> zeroinitializer, align 16
9 @vfr = common global <4 x float> zeroinitializer, align 16
10 @vbllr = common global <2 x i64> zeroinitializer, align 16
11 @vbir = common global <4 x i32> zeroinitializer, align 16
12 @vblla = common global <2 x i64> zeroinitializer, align 16
13 @vbllb = common global <2 x i64> zeroinitializer, align 16
14 @vbia = common global <4 x i32> zeroinitializer, align 16
15 @vbib = common global <4 x i32> zeroinitializer, align 16
17 ; Function Attrs: nounwind
18 define void @test1() {
20 %0 = load <2 x double>, ptr @vda, align 16
21 %1 = load <2 x double>, ptr @vdb, align 16
22 %2 = call <2 x double> @llvm.ppc.vsx.xvdivdp(<2 x double> %0, <2 x double> %1)
23 store <2 x double> %2, ptr @vdr, align 16
26 ; CHECK: xvdivdp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
29 ; Function Attrs: nounwind
30 define void @test2() {
32 %0 = load <4 x float>, ptr @vfa, align 16
33 %1 = load <4 x float>, ptr @vfb, align 16
34 %2 = call <4 x float> @llvm.ppc.vsx.xvdivsp(<4 x float> %0, <4 x float> %1)
35 store <4 x float> %2, ptr @vfr, align 16
38 ; CHECK: xvdivsp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
41 ; Function Attrs: nounwind
42 define void @test3() {
44 %0 = load <2 x double>, ptr @vda, align 16
45 %1 = load <2 x double>, ptr @vda, align 16
46 %2 = call <2 x double> @llvm.ceil.v2f64(<2 x double> %1)
47 store <2 x double> %2, ptr @vdr, align 16
50 ; CHECK: xvrdpip {{[0-9]+}}, {{[0-9]+}}
53 ; Function Attrs: nounwind
54 define void @test4() {
56 %0 = load <4 x float>, ptr @vfa, align 16
57 %1 = load <4 x float>, ptr @vfa, align 16
58 %2 = call <4 x float> @llvm.ceil.v4f32(<4 x float> %1)
59 store <4 x float> %2, ptr @vfr, align 16
62 ; CHECK: xvrspip {{[0-9]+}}, {{[0-9]+}}
65 ; Function Attrs: nounwind
66 define void @test5() {
68 %0 = load <2 x double>, ptr @vda, align 16
69 %1 = load <2 x double>, ptr @vdb, align 16
70 %2 = call <2 x i64> @llvm.ppc.vsx.xvcmpeqdp(<2 x double> %0, <2 x double> %1)
71 store <2 x i64> %2, ptr @vbllr, align 16
74 ; CHECK: xvcmpeqdp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
77 ; Function Attrs: nounwind
78 define void @test6() {
80 %0 = load <4 x float>, ptr @vfa, align 16
81 %1 = load <4 x float>, ptr @vfb, align 16
82 %2 = call <4 x i32> @llvm.ppc.vsx.xvcmpeqsp(<4 x float> %0, <4 x float> %1)
83 store <4 x i32> %2, ptr @vbir, align 16
86 ; CHECK: xvcmpeqsp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
89 ; Function Attrs: nounwind
90 define void @test7() {
92 %0 = load <2 x double>, ptr @vda, align 16
93 %1 = load <2 x double>, ptr @vdb, align 16
94 %2 = call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %0, <2 x double> %1)
95 store <2 x i64> %2, ptr @vbllr, align 16
98 ; CHECK: xvcmpgedp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
101 ; Function Attrs: nounwind
102 define void @test8() {
104 %0 = load <4 x float>, ptr @vfa, align 16
105 %1 = load <4 x float>, ptr @vfb, align 16
106 %2 = call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %0, <4 x float> %1)
107 store <4 x i32> %2, ptr @vbir, align 16
109 ; CHECK-LABEL: @test8
110 ; CHECK: xvcmpgesp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
113 ; Function Attrs: nounwind
114 define void @test9() {
116 %0 = load <2 x double>, ptr @vda, align 16
117 %1 = load <2 x double>, ptr @vdb, align 16
118 %2 = call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %0, <2 x double> %1)
119 store <2 x i64> %2, ptr @vbllr, align 16
121 ; CHECK-LABEL: @test9
122 ; CHECK: xvcmpgtdp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
125 ; Function Attrs: nounwind
126 define void @test10() {
128 %0 = load <4 x float>, ptr @vfa, align 16
129 %1 = load <4 x float>, ptr @vfb, align 16
130 %2 = call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %0, <4 x float> %1)
131 store <4 x i32> %2, ptr @vbir, align 16
133 ; CHECK-LABEL: @test10
134 ; CHECK: xvcmpgtsp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}
137 ; Function Attrs: nounwind
138 define <4 x float> @emit_xvresp(<4 x float> %a) {
140 %a.addr = alloca <4 x float>, align 16
141 store <4 x float> %a, ptr %a.addr, align 16
142 %0 = load <4 x float>, ptr %a.addr, align 16
143 %1 = call <4 x float> @llvm.ppc.vsx.xvresp(<4 x float> %0)
145 ; CHECK-LABEL: @emit_xvresp
146 ; CHECK: xvresp {{[0-9]+}}, {{[0-9]+}}
149 ; Function Attrs: nounwind
150 define <2 x double> @emit_xvredp(<2 x double> %a) {
152 %a.addr = alloca <2 x double>, align 16
153 store <2 x double> %a, ptr %a.addr, align 16
154 %0 = load <2 x double>, ptr %a.addr, align 16
155 %1 = call <2 x double> @llvm.ppc.vsx.xvredp(<2 x double> %0)
157 ; CHECK-LABEL: @emit_xvredp
158 ; CHECK: xvredp {{[0-9]+}}, {{[0-9]+}}
161 ; Function Attrs: nounwind readnone
162 define <4 x i32> @emit_xvcvdpsxws(<2 x double> %a) {
164 %0 = tail call <4 x i32> @llvm.ppc.vsx.xvcvdpsxws(<2 x double> %a)
166 ; CHECK-LABEL: @emit_xvcvdpsxws
167 ; CHECK: xvcvdpsxws 34, 34
170 ; Function Attrs: nounwind readnone
171 define <4 x i32> @emit_xvcvdpuxws(<2 x double> %a) {
173 %0 = tail call <4 x i32> @llvm.ppc.vsx.xvcvdpuxws(<2 x double> %a)
175 ; CHECK-LABEL: @emit_xvcvdpuxws
176 ; CHECK: xvcvdpuxws 34, 34
179 ; Function Attrs: nounwind readnone
180 define <2 x double> @emit_xvcvsxwdp(<4 x i32> %a) {
182 %0 = tail call <2 x double> @llvm.ppc.vsx.xvcvsxwdp(<4 x i32> %a)
184 ; CHECK-LABEL: @emit_xvcvsxwdp
185 ; CHECK: xvcvsxwdp 34, 34
188 ; Function Attrs: nounwind readnone
189 define <2 x double> @emit_xvcvuxwdp(<4 x i32> %a) {
191 %0 = tail call <2 x double> @llvm.ppc.vsx.xvcvuxwdp(<4 x i32> %a)
193 ; CHECK-LABEL: @emit_xvcvuxwdp
194 ; CHECK: xvcvuxwdp 34, 34
197 ; Function Attrs: nounwind readnone
198 define <2 x double> @emit_xvcvspdp(<4 x float> %a) {
200 %0 = tail call <2 x double> @llvm.ppc.vsx.xvcvspdp(<4 x float> %a)
202 ; CHECK-LABEL: @emit_xvcvspdp
203 ; CHECK: xvcvspdp 34, 34
206 ; Function Attrs: nounwind readnone
207 define <4 x float> @emit_xvcvsxdsp(<2 x i64> %a) {
209 %0 = tail call <4 x float> @llvm.ppc.vsx.xvcvsxdsp(<2 x i64> %a)
211 ; CHECK-LABEL: @emit_xvcvsxdsp
212 ; CHECK: xvcvsxdsp 34, 34
215 ; Function Attrs: nounwind readnone
216 define <4 x float> @emit_xvcvuxdsp(<2 x i64> %a) {
218 %0 = tail call <4 x float> @llvm.ppc.vsx.xvcvuxdsp(<2 x i64> %a)
220 ; CHECK-LABEL: @emit_xvcvuxdsp
221 ; CHECK: xvcvuxdsp 34, 34
224 ; Function Attrs: nounwind readnone
225 define <4 x float> @emit_xvcvdpsp(<2 x double> %a) {
227 %0 = tail call <4 x float> @llvm.ppc.vsx.xvcvdpsp(<2 x double> %a)
229 ; CHECK-LABEL: @emit_xvcvdpsp
230 ; CHECK: xvcvdpsp 34, 34
233 define dso_local <2 x i64> @emit_xvcvspsxds(<4 x float> %a) local_unnamed_addr #0 {
235 %0 = tail call <2 x i64> @llvm.ppc.vsx.xvcvspsxds(<4 x float> %a)
237 ; CHECK-LABEL: @emit_xvcvspsxds
238 ; CHECK: xvcvspsxds 34, 34
241 define dso_local <2 x i64> @emit_xvcvspuxds(<4 x float> %a) local_unnamed_addr #0 {
243 %0 = tail call <2 x i64> @llvm.ppc.vsx.xvcvspuxds(<4 x float> %a)
245 ; CHECK-LABEL: @emit_xvcvspuxds
246 ; CHECK: xvcvspuxds 34, 34
249 ; Function Attrs: nounwind readnone
250 declare <4 x float> @llvm.ppc.vsx.xvresp(<4 x float>)
252 ; Function Attrs: nounwind readnone
253 declare <2 x double> @llvm.ppc.vsx.xvredp(<2 x double>)
255 ; Function Attrs: nounwind readnone
256 declare <2 x double> @llvm.ceil.v2f64(<2 x double>)
258 ; Function Attrs: nounwind readnone
259 declare <4 x float> @llvm.ceil.v4f32(<4 x float>)
261 ; Function Attrs: nounwind readnone
262 declare <2 x double> @llvm.ppc.vsx.xvdivdp(<2 x double>, <2 x double>)
264 ; Function Attrs: nounwind readnone
265 declare <4 x float> @llvm.ppc.vsx.xvdivsp(<4 x float>, <4 x float>)
267 ; Function Attrs: nounwind readnone
268 declare <2 x i64> @llvm.ppc.vsx.xvcmpeqdp(<2 x double>, <2 x double>)
270 ; Function Attrs: nounwind readnone
271 declare <4 x i32> @llvm.ppc.vsx.xvcmpeqsp(<4 x float>, <4 x float>)
273 ; Function Attrs: nounwind readnone
274 declare <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double>, <2 x double>)
276 ; Function Attrs: nounwind readnone
277 declare <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float>, <4 x float>)
279 ; Function Attrs: nounwind readnone
280 declare <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double>, <2 x double>)
282 ; Function Attrs: nounwind readnone
283 declare <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float>, <4 x float>)
284 declare <4 x float> @llvm.ppc.vsx.xvcvdpsp(<2 x double>) #1
285 declare <4 x i32> @llvm.ppc.vsx.xvcvdpsxws(<2 x double>) #1
286 declare <4 x i32> @llvm.ppc.vsx.xvcvdpuxws(<2 x double>) #1
287 declare <2 x double> @llvm.ppc.vsx.xvcvsxwdp(<4 x i32>) #1
288 declare <2 x double> @llvm.ppc.vsx.xvcvuxwdp(<4 x i32>) #1
289 declare <2 x double> @llvm.ppc.vsx.xvcvspdp(<4 x float>) #1
290 declare <4 x float> @llvm.ppc.vsx.xvcvsxdsp(<2 x i64>) #1
291 declare <4 x float> @llvm.ppc.vsx.xvcvuxdsp(<2 x i64>) #1
292 declare <2 x i64> @llvm.ppc.vsx.xvcvspsxds(<4 x float>) #1
293 declare <2 x i64> @llvm.ppc.vsx.xvcvspuxds(<4 x float>) #1