1 ; RUN: llc < %s -mtriple x86_64-unknown-linux-gnu -mattr +avx | FileCheck %s
2 ; RUN: llc < %s -mtriple x86_64-unknown-linux-gnu -mattr +avx512f | FileCheck %s
4 define <4 x float> @testxmm_1(<4 x float> %_xmm0, i64 %_l) {
5 ; CHECK: vmovhlps %xmm1, %xmm0, %xmm0
7 %0 = tail call <4 x float> asm "vmovhlps $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l, <4 x float> %_xmm0)
11 define <4 x float> @testxmm_2(<4 x float> %_xmm0, i64 %_l) {
12 ; CHECK: movapd %xmm0, %xmm0
14 %0 = tail call <4 x float> asm "movapd $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l)
18 define <4 x float> @testxmm_3(<4 x float> %_xmm0, i64 %_l) {
19 ; CHECK: vmovapd %xmm0, %xmm0
21 %0 = tail call <4 x float> asm "vmovapd $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l)
25 define <4 x float> @testxmm_4(<4 x float> %_xmm0, i64 %_l) {
26 ; CHECK: vmpsadbw $0, %xmm1, %xmm0, %xmm0
28 %0 = tail call <4 x float> asm "vmpsadbw $$0, $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l, <4 x float> %_xmm0)
32 define <4 x float> @testxmm_5(<4 x float> %_xmm0, i64 %_l) {
33 ; CHECK: vminpd %xmm0, %xmm0, %xmm0
35 %0 = tail call <4 x float> asm "vminpd $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l, i64 %_l)
39 define i64 @testxmm_6(i64 returned %_l) {
40 ; CHECK: vmovd %xmm0, %eax
42 tail call void asm sideeffect "vmovd $0, %eax", "v,~{dirflag},~{fpsr},~{flags}"(i64 %_l)
46 define <4 x float> @testxmm_7(<4 x float> returned %_xmm0) {
47 ; CHECK: vmovmskps %xmm0, %eax
49 tail call void asm sideeffect "vmovmskps $0, %rax", "v,~{dirflag},~{fpsr},~{flags}"(<4 x float> %_xmm0)
50 ret <4 x float> %_xmm0
53 define i64 @testxmm_8(<4 x float> %_xmm0, i64 %_l) {
54 ; CHECK: vmulsd %xmm1, %xmm0, %xmm0
56 %0 = tail call i64 asm "vmulsd $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l, <4 x float> %_xmm0)
60 define <4 x float> @testxmm_9(<4 x float> %_xmm0, i64 %_l) {
61 ; CHECK: vorpd %xmm1, %xmm0, %xmm0
63 %0 = tail call <4 x float> asm "vorpd $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l, <4 x float> %_xmm0)
67 define <4 x float> @testxmm_10(<4 x float> %_xmm0, i64 %_l) {
68 ; CHECK: pabsb %xmm0, %xmm0
70 %0 = tail call <4 x float> asm "pabsb $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l)
74 define <4 x float> @testxmm_11(<4 x float> %_xmm0, i64 %_l) {
75 ; CHECK: vpabsd %xmm0, %xmm0
77 %0 = tail call <4 x float> asm "vpabsd $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(i64 %_l)
81 define <8 x float> @testymm_1(<8 x float> %_ymm0, <8 x float> %_ymm1) {
82 ; CHECK: vmovsldup %ymm0, %ymm0
84 %0 = tail call <8 x float> asm "vmovsldup $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm0)
88 define <8 x float> @testymm_2(<8 x float> %_ymm0, <8 x float> %_ymm1) {
89 ; CHECK: vmovapd %ymm1, %ymm0
91 %0 = tail call <8 x float> asm "vmovapd $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1)
95 define <8 x float> @testymm_3(<8 x float> %_ymm0, <8 x float> %_ymm1) {
96 ; CHECK: vminpd %ymm1, %ymm0, %ymm0
98 %0 = tail call <8 x float> asm "vminpd $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1, <8 x float> %_ymm0)
102 define <8 x float> @testymm_4(<8 x float> %_ymm0, <8 x float> %_ymm1) {
103 ; CHECK: vorpd %ymm1, %ymm0, %ymm0
105 %0 = tail call <8 x float> asm "vorpd $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1, <8 x float> %_ymm0)
109 define <8 x float> @testymm(<8 x float> %_ymm0, <8 x float> %_ymm1) {
110 ; CHECK: vmulps %ymm1, %ymm0, %ymm0
112 %0 = tail call <8 x float> asm "vmulps $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1, <8 x float> %_ymm0)
116 define <8 x float> @testymm_6(<8 x float> %_ymm0, <8 x float> %_ymm1) {
117 ; CHECK: vmulpd %ymm1, %ymm0, %ymm0
119 %0 = tail call <8 x float> asm "vmulpd $1, $2, $0", "=v,v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1, <8 x float> %_ymm0)
123 define <8 x float> @testymm_7(<8 x float> %_ymm0, <8 x float> %_ymm1) {
124 ; CHECK: vmovups %ymm1, %ymm0
126 %0 = tail call <8 x float> asm "vmovups $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1)
130 define <8 x float> @testymm_8(<8 x float> %_ymm0, <8 x float> %_ymm1) {
131 ; CHECK: vmovupd %ymm1, %ymm0
133 %0 = tail call <8 x float> asm "vmovupd $1, $0", "=v,v,~{dirflag},~{fpsr},~{flags}"(<8 x float> %_ymm1)