1 ; RUN: llc < %s -mtriple=i686-pc-win32 -mattr=+sse2 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE2
2 ; RUN: llc < %s -mtriple=i686-pc-win32 -mattr=+sse2,+avx | FileCheck %s --check-prefix=CHECK --check-prefix=AVX
3 ; RUN: llc < %s -mtriple=i686-pc-win32 -mattr=+sse2,+avx,+avx512f | FileCheck %s --check-prefix=CHECK --check-prefix=AVX512
5 ; While we don't support varargs with fastcall, we do support forwarding.
7 @asdf = internal constant [4 x i8] c"asdf"
9 declare void @puts(i8*)
11 define i32 @call_fast_thunk() {
12 %r = call x86_fastcallcc i32 (...) @fast_thunk(i32 inreg 1, i32 inreg 2, i32 3)
16 define x86_fastcallcc i32 @fast_thunk(...) {
17 call void @puts(i8* getelementptr ([4 x i8], [4 x i8]* @asdf, i32 0, i32 0))
18 %r = musttail call x86_fastcallcc i32 (...) bitcast (i32 (i32, i32, i32)* @fast_target to i32 (...)*) (...)
22 ; Check that we spill and fill around the call to puts.
24 ; CHECK-LABEL: @fast_thunk@0:
25 ; CHECK-DAG: movl %ecx, {{.*}}
26 ; CHECK-DAG: movl %edx, {{.*}}
28 ; CHECK-DAG: movl {{.*}}, %ecx
29 ; CHECK-DAG: movl {{.*}}, %edx
30 ; CHECK: jmp @fast_target@12
32 define x86_fastcallcc i32 @fast_target(i32 inreg %a, i32 inreg %b, i32 %c) {
38 ; Repeat the test for vectorcall, which has XMM registers.
40 define i32 @call_vector_thunk() {
41 %r = call x86_vectorcallcc i32 (...) @vector_thunk(i32 inreg 1, i32 inreg 2, i32 3)
45 define x86_vectorcallcc i32 @vector_thunk(...) {
46 call void @puts(i8* getelementptr ([4 x i8], [4 x i8]* @asdf, i32 0, i32 0))
47 %r = musttail call x86_vectorcallcc i32 (...) bitcast (i32 (i32, i32, i32)* @vector_target to i32 (...)*) (...)
51 ; Check that we spill and fill SSE registers around the call to puts.
53 ; CHECK-LABEL: vector_thunk@@0:
54 ; CHECK-DAG: movl %ecx, {{.*}}
55 ; CHECK-DAG: movl %edx, {{.*}}
57 ; SSE2-DAG: movups %xmm0, {{.*}}
58 ; SSE2-DAG: movups %xmm1, {{.*}}
59 ; SSE2-DAG: movups %xmm2, {{.*}}
60 ; SSE2-DAG: movups %xmm3, {{.*}}
61 ; SSE2-DAG: movups %xmm4, {{.*}}
62 ; SSE2-DAG: movups %xmm5, {{.*}}
64 ; AVX-DAG: vmovups %ymm0, {{.*}}
65 ; AVX-DAG: vmovups %ymm1, {{.*}}
66 ; AVX-DAG: vmovups %ymm2, {{.*}}
67 ; AVX-DAG: vmovups %ymm3, {{.*}}
68 ; AVX-DAG: vmovups %ymm4, {{.*}}
69 ; AVX-DAG: vmovups %ymm5, {{.*}}
71 ; AVX512-DAG: vmovups %zmm0, {{.*}}
72 ; AVX512-DAG: vmovups %zmm1, {{.*}}
73 ; AVX512-DAG: vmovups %zmm2, {{.*}}
74 ; AVX512-DAG: vmovups %zmm3, {{.*}}
75 ; AVX512-DAG: vmovups %zmm4, {{.*}}
76 ; AVX512-DAG: vmovups %zmm5, {{.*}}
80 ; SSE2-DAG: movups {{.*}}, %xmm0
81 ; SSE2-DAG: movups {{.*}}, %xmm1
82 ; SSE2-DAG: movups {{.*}}, %xmm2
83 ; SSE2-DAG: movups {{.*}}, %xmm3
84 ; SSE2-DAG: movups {{.*}}, %xmm4
85 ; SSE2-DAG: movups {{.*}}, %xmm5
87 ; AVX-DAG: vmovups {{.*}}, %ymm0
88 ; AVX-DAG: vmovups {{.*}}, %ymm1
89 ; AVX-DAG: vmovups {{.*}}, %ymm2
90 ; AVX-DAG: vmovups {{.*}}, %ymm3
91 ; AVX-DAG: vmovups {{.*}}, %ymm4
92 ; AVX-DAG: vmovups {{.*}}, %ymm5
94 ; AVX512-DAG: vmovups {{.*}}, %zmm0
95 ; AVX512-DAG: vmovups {{.*}}, %zmm1
96 ; AVX512-DAG: vmovups {{.*}}, %zmm2
97 ; AVX512-DAG: vmovups {{.*}}, %zmm3
98 ; AVX512-DAG: vmovups {{.*}}, %zmm4
99 ; AVX512-DAG: vmovups {{.*}}, %zmm5
101 ; CHECK-DAG: movl {{.*}}, %ecx
102 ; CHECK-DAG: movl {{.*}}, %edx
103 ; CHECK: jmp vector_target@@12
105 define x86_vectorcallcc i32 @vector_target(i32 inreg %a, i32 inreg %b, i32 %c) {
107 %a1 = add i32 %a0, %c