Merge "Add save/restore xmm registers in x86 assembly code"
[libvpx.git] / vpx_ports / x86_abi_support.asm
blob60dff4916845a5d4d58c67933c3ce7daefea86c0
2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved.
4 ; Use of this source code is governed by a BSD-style license
5 ; that can be found in the LICENSE file in the root of the source
6 ; tree. An additional intellectual property rights grant can be found
7 ; in the file PATENTS. All contributing project authors may
8 ; be found in the AUTHORS file in the root of the source tree.
12 %include "vpx_config.asm"
; 32/64 bit compatibility macros
;
; The sources are written using 64 bit syntax; on 32 bit platforms the
; preprocessor rewrites that syntax into its 32 bit equivalent.
;
; ABI_IS_32BIT
;   1 when the output format is one of the 32 bit formats listed below,
;   0 for every other output format.
%ifidn __OUTPUT_FORMAT__,win32
  %define ABI_IS_32BIT 1
%elifidn __OUTPUT_FORMAT__,macho32
  %define ABI_IS_32BIT 1
%elifidn __OUTPUT_FORMAT__,elf32
  %define ABI_IS_32BIT 1
%else
  %define ABI_IS_32BIT 0
%endif
; 32 bit rewrites: map the 64 bit names used in the sources onto their
; 32 bit counterparts.
%if ABI_IS_32BIT
  ; General-purpose registers.
  %define rsp esp
  %define rbp ebp
  %define rsi esi
  %define rdi edi
  %define rax eax
  %define rbx ebx
  %define rcx ecx
  %define rdx edx

  ; movsxd becomes a plain mov.
  %define movsxd mov

  ; movq <dst>, <src>
  ;   If either operand is one of the 32 bit general-purpose registers,
  ;   emit movd instead; otherwise emit movq unchanged. The movq in the
  ;   final branch relies on the assembler not re-expanding a %macro
  ;   inside its own body.
  %macro movq 2
    ; --- destination is a general-purpose register ---
    %ifidn %1,eax
      movd %1,%2
    %elifidn %1,ebx
      movd %1,%2
    %elifidn %1,ecx
      movd %1,%2
    %elifidn %1,edx
      movd %1,%2
    %elifidn %1,esi
      movd %1,%2
    %elifidn %1,edi
      movd %1,%2
    %elifidn %1,esp
      movd %1,%2
    %elifidn %1,ebp
      movd %1,%2
    ; --- source is a general-purpose register ---
    %elifidn %2,eax
      movd %1,%2
    %elifidn %2,ebx
      movd %1,%2
    %elifidn %2,ecx
      movd %1,%2
    %elifidn %2,edx
      movd %1,%2
    %elifidn %2,esi
      movd %1,%2
    %elifidn %2,edi
      movd %1,%2
    %elifidn %2,esp
      movd %1,%2
    %elifidn %2,ebp
      movd %1,%2
    ; --- neither operand is a general-purpose register ---
    %else
      movq %1,%2
    %endif
  %endmacro
%endif
; sym(x)
;   Expands to the symbol name to use for C symbol x under the target ABI.
;
;   Some ABIs, notably MS COFF and Darwin MACH-O, require symbols with C
;   linkage to carry a leading underscore. The elf32, elf64 and x64 output
;   formats use the name unchanged; every other output format gets the
;   underscore prefix.
%ifidn __OUTPUT_FORMAT__,x64
  %define sym(x) x
%elifidn __OUTPUT_FORMAT__,elf64
  %define sym(x) x
%elifidn __OUTPUT_FORMAT__,elf32
  %define sym(x) x
%else
  %define sym(x) _ %+ x
%endif
; arg(x)
;   Expands to the memory operand that addresses argument number x
;   (zero based), relative to the frame pointer.
;
;   32 bit:        [ebp+8+4*x]
;   64 bit, x64:   [rbp+16+8*x]
;   64 bit, other: [rbp-8-8*x]
;
;   The 64 bit ABIs pass arguments in registers. As a workaround to get up
;   and running quickly, the 64 bit forms rely on SHADOW_ARGS_TO_STACK
;   having stored the register arguments in memory first.
%if ABI_IS_32BIT
  %define arg(x) [ebp+8+4*x]
%elifidn __OUTPUT_FORMAT__,x64
  %define arg(x) [rbp+16+8*x]
%else
  %define arg(x) [rbp-8-8*x]
%endif
; REG_SZ_BYTES, REG_SZ_BITS
;   Width of a general-purpose register for the selected ABI, expressed in
;   bytes and in bits respectively.
%if ABI_IS_32BIT = 0
  %define REG_SZ_BITS  64
  %define REG_SZ_BYTES 8
%else
  %define REG_SZ_BITS  32
  %define REG_SZ_BYTES 4
%endif
; ALIGN_STACK <alignment> <register>
;   Aligns the stack pointer to <alignment> bytes and leaves the previous
;   stack pointer value as the first item on the stack, so the inverse of
;   this macro is 'pop rsp'.
;
;   <register> is used as a temporary and is NOT preserved; the caller
;   picks which register may be overwritten.
%macro ALIGN_STACK 2
    mov   %2, rsp                              ; remember the incoming rsp
    and   rsp, -%1                             ; round rsp down to the alignment
    lea   rsp, [rsp + REG_SZ_BYTES - (%1)]     ; leave room so the push below
                                               ; lands on an aligned address
    push  %2                                   ; [rsp] = incoming rsp
%endmacro
; MASM-style type keywords
;
; The Microsoft assembler imposes a degree of type safety on register and
; memory operands through keywords such as PTR. YASM does not recognize
; them, so they are defined (case-insensitively) to expand to nothing.
; This keeps the sources close to the original inline assembler they were
; ported from.
%idefine MMWORD
%idefine XMMWORD
%idefine PTR
; PIC macros
;
; GET_GOT <reg>
;   Prepare <reg> for position-independent access to global data. On
;   32 bit PIC builds (elf32, macho32) this pushes <reg> on the stack and
;   loads it with a base address; everywhere else it expands to nothing.
; GLOBAL(x)
;   Operand expression addressing global symbol x. On 32 bit PIC builds it
;   is (re)defined by each GET_GOT invocation in terms of that
;   invocation's register.
; RESTORE_GOT
;   Undo GET_GOT: pops the register saved by the most recent GET_GOT, or
;   expands to nothing when GET_GOT did not push anything.
; WRT_PLT
;   'wrt ..plt' on elf32 PIC and elf64 builds, empty otherwise.
; HIDDEN_DATA(x)
;   Declaration form for data symbol x; adds ':data hidden' on elf64 only.
%if ABI_IS_32BIT
  %if CONFIG_PIC=1
  %ifidn __OUTPUT_FORMAT__,elf32
    %define WRT_PLT wrt ..plt
    %macro GET_GOT 1
      extern _GLOBAL_OFFSET_TABLE_
      push %1                         ; saved copy, popped by RESTORE_GOT
      call %%get_got                  ; pushes the address of %%sub_offset
      %%sub_offset:
      jmp %%exitGG                    ; reached when %%get_got returns
      %%get_got:
      mov %1, [esp]                   ; %1 = return address = %%sub_offset
      add %1, _GLOBAL_OFFSET_TABLE_ + $$ - %%sub_offset wrt ..gotpc
      ret                             ; pop the return address again so the
                                      ; value saved by 'push %1' is back on
                                      ; top of the stack for RESTORE_GOT
      %%exitGG:
      %undef GLOBAL
      %define GLOBAL(x) x + %1 wrt ..gotoff
      %undef RESTORE_GOT
      %define RESTORE_GOT pop %1
    %endmacro
  %elifidn __OUTPUT_FORMAT__,macho32
    %macro GET_GOT 1
      push %1                         ; saved copy, popped by RESTORE_GOT
      call %%get_got                  ; pushes the address of %%get_got
      %%get_got:
      pop %1                          ; %1 = address of %%get_got
      %undef GLOBAL
      %define GLOBAL(x) x + %1 - %%get_got
      %undef RESTORE_GOT
      %define RESTORE_GOT pop %1
    %endmacro
  %endif
  %endif
  %define HIDDEN_DATA(x) x
%else
  ; 64 bit: no register needs to be set up; globals are addressed
  ; with 'rel'.
  %macro GET_GOT 1
  %endmacro
  %define GLOBAL(x) rel x
  %ifidn __OUTPUT_FORMAT__,elf64
    %define WRT_PLT wrt ..plt
    %define HIDDEN_DATA(x) x:data hidden
  %else
    %define HIDDEN_DATA(x) x
  %endif
%endif

; Fallbacks for every configuration that did not define the macros above
; (for example 32 bit builds without CONFIG_PIC).
%ifnmacro GET_GOT
  %macro GET_GOT 1
  %endmacro
  %define GLOBAL(x) x
%endif
%ifndef RESTORE_GOT
  %define RESTORE_GOT
%endif
%ifndef WRT_PLT
  %define WRT_PLT
%endif
; SHADOW_ARGS_TO_STACK <argc>
;   Stores the first <argc> arguments in memory so that they can be read
;   through arg(). NOTE(review): the rbp-relative addressing presumably
;   expects rbp to have been set up as the frame pointer beforehand --
;   confirm against the callers.
;
;   32 bit:        expands to nothing.
;   64 bit, x64:   stores rcx, rdx, r8, r9 (as many as <argc> requires)
;                  into arg(0)..arg(3).
;   64 bit, other: pushes rdi, rsi, rdx, rcx, r8, r9 (as many as <argc>
;                  requires), then copies any further arguments from
;                  [rbp+16] upwards and pushes them too. rax is used as
;                  the scratch register for those copies and is
;                  overwritten. The preprocessor variables 'i' and 'off'
;                  are assigned as a side effect.
;
; UNSHADOW_ARGS
;   64 bit: 'mov rsp, rbp'. 32 bit: expands to nothing.
%if ABI_IS_32BIT
  %macro SHADOW_ARGS_TO_STACK 1
  %endmacro
  %define UNSHADOW_ARGS
%else
  %ifidn __OUTPUT_FORMAT__,x64
    %macro SHADOW_ARGS_TO_STACK 1 ; argc
      %if %1 > 0
        mov arg(0),rcx
      %endif
      %if %1 > 1
        mov arg(1),rdx
      %endif
      %if %1 > 2
        mov arg(2),r8
      %endif
      %if %1 > 3
        mov arg(3),r9
      %endif
    %endmacro
  %else
    %macro SHADOW_ARGS_TO_STACK 1 ; argc
      ; Register arguments, in argument order.
      %if %1 > 0
        push rdi
      %endif
      %if %1 > 1
        push rsi
      %endif
      %if %1 > 2
        push rdx
      %endif
      %if %1 > 3
        push rcx
      %endif
      %if %1 > 4
        push r8
      %endif
      %if %1 > 5
        push r9
      %endif
      ; Remaining arguments: copy each one from [rbp+off] and push it.
      %if %1 > 6
        %assign i %1-6
        %assign off 16
        %rep i
          mov rax,[rbp+off]
          push rax
          %assign off off+8
        %endrep
      %endif
    %endmacro
  %endif
  %define UNSHADOW_ARGS mov rsp, rbp
%endif
; SAVE_XMM / RESTORE_XMM
;   The Win64 ABI requires XMM6:XMM15 to be kept across a call; libvpx
;   uses XMM6 and XMM7, so only those two are handled.
;
;   x64:   SAVE_XMM reserves 32 bytes on the stack and stores xmm6 at
;          [rsp] and xmm7 at [rsp+16]. RESTORE_XMM reloads both and
;          releases the 32 bytes, so rsp must hold the same value it had
;          right after SAVE_XMM.
;   other: both macros expand to nothing.
;
;   Original note: the rsp register has to be aligned. (The stores and
;   loads themselves use the unaligned movdqu form.)
%ifidn __OUTPUT_FORMAT__,x64
  %macro SAVE_XMM 0
    sub rsp, 32
    movdqu XMMWORD PTR [rsp+16], xmm7
    movdqu XMMWORD PTR [rsp], xmm6
  %endmacro
  %macro RESTORE_XMM 0
    movdqu xmm7, XMMWORD PTR [rsp+16]
    movdqu xmm6, XMMWORD PTR [rsp]
    add rsp, 32
  %endmacro
%else
  %macro SAVE_XMM 0
  %endmacro
  %macro RESTORE_XMM 0
  %endmacro
%endif
; SECTION_RODATA
;   Switches to the section used for read-only data.
;
;   .rodata seems to be an elf-ism, as it doesn't work on OSX; the two
;   macho formats therefore use .text instead.
%ifidn __OUTPUT_FORMAT__,macho32
  %macro SECTION_RODATA 0
    section .text
  %endmacro
%elifidn __OUTPUT_FORMAT__,macho64
  %define SECTION_RODATA section .text
%else
  %define SECTION_RODATA section .rodata
%endif
; Tell GNU ld that we don't require an executable stack. On the two ELF
; output formats this emits an empty .note.GNU-stack section and then
; switches back to .text; other formats emit nothing.
%ifidn __OUTPUT_FORMAT__,elf64
  section .note.GNU-stack noalloc noexec nowrite progbits
  section .text
%elifidn __OUTPUT_FORMAT__,elf32
  section .note.GNU-stack noalloc noexec nowrite progbits
  section .text
%endif