1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc < %s -mcpu=pentium2 -mtriple=i686-apple-darwin8.8.0 | FileCheck %s --check-prefix=X86
3 ; RUN: llc < %s -mcpu=pentium3 -mtriple=i686-apple-darwin8.8.0 | FileCheck %s --check-prefix=XMM
4 ; RUN: llc < %s -mcpu=bdver1 -mtriple=i686-apple-darwin8.8.0 | FileCheck %s --check-prefix=YMM
; Pair of i16 fields; @t below allocates a stack array of eight of these.
6 %struct.x = type { i16, i16 }
; @t: zero a 32-byte stack buffer with an 8-byte-aligned llvm.memset, then pass
; the buffer to @foo. The three check groups pin how that memset is lowered for
; each -mcpu named in the RUN lines at the top of the file:
;   pentium2 (X86 prefix) - eight 4-byte "movl $0" stores.
;   pentium3 (XMM prefix) - xmm0 zeroed with xorps, then two 16-byte movaps stores.
;   bdver1   (YMM prefix) - xmm0 zeroed with vxorps, then one 32-byte vmovups
;                           store of ymm0, with vzeroupper issued before the call.
; NOTE(review): the movaps stores require a 16-byte-aligned slot although the
; memset only states align 8 - presumably the backend raises the alignment of
; the alloca; confirm before relying on it.
8 define void @t() nounwind {
10 ; X86: ## %bb.0: ## %entry
11 ; X86-NEXT: subl $44, %esp
12 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
13 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
14 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
15 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
16 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
17 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
18 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
19 ; X86-NEXT: movl $0, {{[0-9]+}}(%esp)
20 ; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
21 ; X86-NEXT: movl %eax, (%esp)
22 ; X86-NEXT: calll _foo
23 ; X86-NEXT: addl $44, %esp
27 ; XMM: ## %bb.0: ## %entry
28 ; XMM-NEXT: subl $60, %esp
29 ; XMM-NEXT: xorps %xmm0, %xmm0
30 ; XMM-NEXT: movaps %xmm0, {{[0-9]+}}(%esp)
31 ; XMM-NEXT: movaps %xmm0, {{[0-9]+}}(%esp)
32 ; XMM-NEXT: leal {{[0-9]+}}(%esp), %eax
33 ; XMM-NEXT: movl %eax, (%esp)
34 ; XMM-NEXT: calll _foo
35 ; XMM-NEXT: addl $60, %esp
39 ; YMM: ## %bb.0: ## %entry
40 ; YMM-NEXT: subl $60, %esp
41 ; YMM-NEXT: leal {{[0-9]+}}(%esp), %eax
42 ; YMM-NEXT: vxorps %xmm0, %xmm0, %xmm0
43 ; YMM-NEXT: vmovups %ymm0, {{[0-9]+}}(%esp)
44 ; YMM-NEXT: movl %eax, (%esp)
45 ; YMM-NEXT: vzeroupper
46 ; YMM-NEXT: calll _foo
47 ; YMM-NEXT: addl $60, %esp
; Stack buffer: eight %struct.x elements.
50 %up_mvd = alloca [8 x %struct.x] ; <ptr> [#uses=2]
; All-zero GEP indices: this is the address of element 0, i.e. the same
; address as %up_mvd.
51 %up_mvd116 = getelementptr [8 x %struct.x], ptr %up_mvd, i32 0, i32 0 ; <ptr> [#uses=1]
; Clear the whole buffer: 32 bytes of value 0, destination marked align 8,
; non-volatile (final i1 is false).
53 call void @llvm.memset.p0.i64(ptr align 8 %up_mvd, i8 0, i64 32, i1 false)
; Hand the zeroed buffer to the external callee.
54 call void @foo( ptr %up_mvd116 ) nounwind
; External function taking a single pointer; @t calls it with its zeroed
; stack buffer.
58 declare void @foo(ptr)
; memset intrinsic variant with an i64 length operand
; (destination, fill byte, length, is-volatile flag).
60 declare void @llvm.memset.p0.i64(ptr nocapture, i8, i64, i1) nounwind
62 ; Ensure that an @llvm.memset intrinsic call with no explicit alignment on
63 ; its destination pointer results in unaligned stores.
; @PR15348: zero 17 bytes at %a with a memset whose destination pointer has no
; align attribute. Expected lowering per check group:
;   X86 and XMM groups - a byte store at offset 16 plus four 4-byte stores
;                        at offsets 12, 8, 4 and 0.
;   YMM group          - one 16-byte vmovups (unaligned form) at offset 0 plus
;                        a byte store at offset 16.
64 define void @PR15348(ptr %a) {
67 ; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
68 ; X86-NEXT: movb $0, 16(%eax)
69 ; X86-NEXT: movl $0, 12(%eax)
70 ; X86-NEXT: movl $0, 8(%eax)
71 ; X86-NEXT: movl $0, 4(%eax)
72 ; X86-NEXT: movl $0, (%eax)
77 ; XMM-NEXT: movl {{[0-9]+}}(%esp), %eax
78 ; XMM-NEXT: movb $0, 16(%eax)
79 ; XMM-NEXT: movl $0, 12(%eax)
80 ; XMM-NEXT: movl $0, 8(%eax)
81 ; XMM-NEXT: movl $0, 4(%eax)
82 ; XMM-NEXT: movl $0, (%eax)
87 ; YMM-NEXT: movl {{[0-9]+}}(%esp), %eax
88 ; YMM-NEXT: vxorps %xmm0, %xmm0, %xmm0
89 ; YMM-NEXT: vmovups %xmm0, (%eax)
90 ; YMM-NEXT: movb $0, 16(%eax)
; 17 bytes of value 0, non-volatile; note there is no align attribute on %a.
92 call void @llvm.memset.p0.i64(ptr %a, i8 0, i64 17, i1 false)
; memset intrinsic variant with an i32 length operand; used by @PR83077.
96 declare void @llvm.memset.p0.i32(ptr nocapture writeonly, i8, i32, i1 immarg)
; @PR83077: fill 90 bytes at %a with the byte value -1 (destination marked
; align 4 and dereferenceable(90)). Expected lowering per check group:
;   X86 and XMM groups - "rep;stosl" with %eax = -1 and %ecx = 22, i.e. 22
;                        four-byte stores (88 bytes), followed by a 2-byte
;                        "movw $-1" at offset 88. %edi is used as the stosl
;                        destination and is saved/restored with pushl/popl.
;   YMM group          - ymm0 is set to all-ones via vxorps + vcmptrueps, then
;                        three 32-byte vmovups stores at offsets 58, 32 and 0.
;                        The store at 58 overlaps the one at 32 so the last
;                        byte written is byte 89.
98 define void @PR83077(ptr %a) {
101 ; X86-NEXT: pushl %edi
102 ; X86-NEXT: .cfi_def_cfa_offset 8
103 ; X86-NEXT: .cfi_offset %edi, -8
104 ; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
105 ; X86-NEXT: movl $-1, %eax
106 ; X86-NEXT: movl $22, %ecx
107 ; X86-NEXT: movl %edx, %edi
108 ; X86-NEXT: rep;stosl %eax, %es:(%edi)
109 ; X86-NEXT: movw $-1, 88(%edx)
110 ; X86-NEXT: popl %edi
113 ; XMM-LABEL: PR83077:
115 ; XMM-NEXT: pushl %edi
116 ; XMM-NEXT: .cfi_def_cfa_offset 8
117 ; XMM-NEXT: .cfi_offset %edi, -8
118 ; XMM-NEXT: movl {{[0-9]+}}(%esp), %edx
119 ; XMM-NEXT: movl $-1, %eax
120 ; XMM-NEXT: movl $22, %ecx
121 ; XMM-NEXT: movl %edx, %edi
122 ; XMM-NEXT: rep;stosl %eax, %es:(%edi)
123 ; XMM-NEXT: movw $-1, 88(%edx)
124 ; XMM-NEXT: popl %edi
127 ; YMM-LABEL: PR83077:
129 ; YMM-NEXT: movl {{[0-9]+}}(%esp), %eax
130 ; YMM-NEXT: vxorps %xmm0, %xmm0, %xmm0
131 ; YMM-NEXT: vcmptrueps %ymm0, %ymm0, %ymm0
132 ; YMM-NEXT: vmovups %ymm0, 58(%eax)
133 ; YMM-NEXT: vmovups %ymm0, 32(%eax)
134 ; YMM-NEXT: vmovups %ymm0, (%eax)
135 ; YMM-NEXT: vzeroupper
; 90 bytes of value -1 (every byte 0xFF), non-volatile.
137 call void @llvm.memset.p0.i32(ptr noundef nonnull align 4 dereferenceable(90) %a, i8 -1, i32 90, i1 false)