1 ; RUN: llc < %s -mtriple=ve -mattr=+vpu | FileCheck %s
3 ;;; Test vector floating square root intrinsic instructions
6 ;;; We test VFSQRT*vl and VFSQRT*vl_v instructions.
8 ; Function Attrs: nounwind readnone
;;; Test case: calls @llvm.ve.vl.vfsqrtd.vvl on the single <256 x double>
;;; argument with an i32 operand of 256 and returns a <256 x double>.
;;; The expected llc output loads 256 into %s0, issues `vfsqrt.d %v0, %v0`,
;;; and then branches through %s10.
;;; NOTE(review): the i32 operand is presumably the vector length (it matches
;;; the value loaded into %s0) -- confirm against the VE intrinsic definitions.
;;; NOTE(review): the embedded line numbering skips values here, so some lines
;;; of this function (e.g. its terminator) are not visible in this view.
9 define fastcc <256 x double> @vfsqrtd_vvl(<256 x double> %0) {
10 ; CHECK-LABEL: vfsqrtd_vvl:
12 ; CHECK-NEXT: lea %s0, 256
14 ; CHECK-NEXT: vfsqrt.d %v0, %v0
15 ; CHECK-NEXT: b.l.t (, %s10)
16 %2 = tail call fast <256 x double> @llvm.ve.vl.vfsqrtd.vvl(<256 x double> %0, i32 256)
20 ; Function Attrs: nounwind readnone
;;; Declaration of the intrinsic @llvm.ve.vl.vfsqrtd.vvl: takes one
;;; <256 x double> operand plus an i32 and returns a <256 x double>.
;;; NOTE(review): the trailing i32 is presumably the vector length -- confirm.
21 declare <256 x double> @llvm.ve.vl.vfsqrtd.vvl(<256 x double>, i32)
23 ; Function Attrs: nounwind readnone
;;; Test case: calls @llvm.ve.vl.vfsqrtd.vvvl with both <256 x double>
;;; arguments and an i32 operand of 128, returning a <256 x double>.
;;; The expected llc output loads 128 into %s0 and issues `vfsqrt.d %v1, %v0`
;;; (the result goes into the register of the second argument), then loads
;;; 256 into %s16, applies it with `lvl`, and emits `vor %v0, (0)1, %v1`
;;; before branching through %s10.
;;; NOTE(review): the second vector argument is presumably a pass-through
;;; value for elements beyond the 128-element length, and the `vor` presumably
;;; copies the full 256-element result into the return register -- confirm.
;;; NOTE(review): the embedded line numbering skips values here, so some lines
;;; of this function (e.g. its terminator) are not visible in this view.
24 define fastcc <256 x double> @vfsqrtd_vvvl(<256 x double> %0, <256 x double> %1) {
25 ; CHECK-LABEL: vfsqrtd_vvvl:
27 ; CHECK-NEXT: lea %s0, 128
29 ; CHECK-NEXT: vfsqrt.d %v1, %v0
30 ; CHECK-NEXT: lea %s16, 256
31 ; CHECK-NEXT: lvl %s16
32 ; CHECK-NEXT: vor %v0, (0)1, %v1
33 ; CHECK-NEXT: b.l.t (, %s10)
34 %3 = tail call fast <256 x double> @llvm.ve.vl.vfsqrtd.vvvl(<256 x double> %0, <256 x double> %1, i32 128)
38 ; Function Attrs: nounwind readnone
;;; Declaration of the intrinsic @llvm.ve.vl.vfsqrtd.vvvl: takes two
;;; <256 x double> operands plus an i32 and returns a <256 x double>.
;;; NOTE(review): the trailing i32 is presumably the vector length -- confirm.
39 declare <256 x double> @llvm.ve.vl.vfsqrtd.vvvl(<256 x double>, <256 x double>, i32)
41 ; Function Attrs: nounwind readnone
;;; Test case: calls @llvm.ve.vl.vfsqrts.vvl on the single argument with an
;;; i32 operand of 256. The IR operand and result type is still
;;; <256 x double>, while the expected instruction is the `.s` form.
;;; The expected llc output loads 256 into %s0, issues `vfsqrt.s %v0, %v0`,
;;; and then branches through %s10.
;;; NOTE(review): the i32 operand is presumably the vector length (it matches
;;; the value loaded into %s0) -- confirm against the VE intrinsic definitions.
;;; NOTE(review): the embedded line numbering skips values here, so some lines
;;; of this function (e.g. its terminator) are not visible in this view.
42 define fastcc <256 x double> @vfsqrts_vvl(<256 x double> %0) {
43 ; CHECK-LABEL: vfsqrts_vvl:
45 ; CHECK-NEXT: lea %s0, 256
47 ; CHECK-NEXT: vfsqrt.s %v0, %v0
48 ; CHECK-NEXT: b.l.t (, %s10)
49 %2 = tail call fast <256 x double> @llvm.ve.vl.vfsqrts.vvl(<256 x double> %0, i32 256)
53 ; Function Attrs: nounwind readnone
;;; Declaration of the intrinsic @llvm.ve.vl.vfsqrts.vvl: takes one
;;; <256 x double> operand plus an i32 and returns a <256 x double>.
;;; NOTE(review): the trailing i32 is presumably the vector length -- confirm.
54 declare <256 x double> @llvm.ve.vl.vfsqrts.vvl(<256 x double>, i32)
56 ; Function Attrs: nounwind readnone
;;; Test case: calls @llvm.ve.vl.vfsqrts.vvvl with both <256 x double>
;;; arguments and an i32 operand of 128, returning a <256 x double>.
;;; The expected llc output loads 128 into %s0 and issues `vfsqrt.s %v1, %v0`
;;; (the result goes into the register of the second argument), then loads
;;; 256 into %s16, applies it with `lvl`, and emits `vor %v0, (0)1, %v1`
;;; before branching through %s10.
;;; NOTE(review): the second vector argument is presumably a pass-through
;;; value for elements beyond the 128-element length, and the `vor` presumably
;;; copies the full 256-element result into the return register -- confirm.
;;; NOTE(review): the embedded line numbering skips values here, so some lines
;;; of this function (e.g. its terminator) are not visible in this view.
57 define fastcc <256 x double> @vfsqrts_vvvl(<256 x double> %0, <256 x double> %1) {
58 ; CHECK-LABEL: vfsqrts_vvvl:
60 ; CHECK-NEXT: lea %s0, 128
62 ; CHECK-NEXT: vfsqrt.s %v1, %v0
63 ; CHECK-NEXT: lea %s16, 256
64 ; CHECK-NEXT: lvl %s16
65 ; CHECK-NEXT: vor %v0, (0)1, %v1
66 ; CHECK-NEXT: b.l.t (, %s10)
67 %3 = tail call fast <256 x double> @llvm.ve.vl.vfsqrts.vvvl(<256 x double> %0, <256 x double> %1, i32 128)
71 ; Function Attrs: nounwind readnone
;;; Declaration of the intrinsic @llvm.ve.vl.vfsqrts.vvvl: takes two
;;; <256 x double> operands plus an i32 and returns a <256 x double>.
;;; NOTE(review): the trailing i32 is presumably the vector length -- confirm.
72 declare <256 x double> @llvm.ve.vl.vfsqrts.vvvl(<256 x double>, <256 x double>, i32)