blob: 7382a913454916c4d00b127e1eb60b4df2550e7b [file] [log] [blame]
John Koleszar0ea50ce2010-05-18 11:58:33 -04001;
John Koleszarc2140b82010-09-09 08:16:39 -04002; Copyright (c) 2010 The WebM project authors. All Rights Reserved.
John Koleszar0ea50ce2010-05-18 11:58:33 -04003;
John Koleszar94c52e42010-06-18 12:39:21 -04004; Use of this source code is governed by a BSD-style license
John Koleszar09202d82010-06-04 16:19:40 -04005; that can be found in the LICENSE file in the root of the source
6; tree. An additional intellectual property rights grant can be found
John Koleszar94c52e42010-06-18 12:39:21 -04007; in the file PATENTS. All contributing project authors may
John Koleszar09202d82010-06-04 16:19:40 -04008; be found in the AUTHORS file in the root of the source tree.
John Koleszar0ea50ce2010-05-18 11:58:33 -04009;
10
11
12%include "vpx_config.asm"
13
14; 32/64 bit compatibility macros
15;
16; In general, we make the source use 64 bit syntax, then twiddle with it using
17; the preprocessor to get the 32 bit syntax on 32 bit platforms.
18;
19%ifidn __OUTPUT_FORMAT__,elf32
20%define ABI_IS_32BIT 1
21%elifidn __OUTPUT_FORMAT__,macho32
22%define ABI_IS_32BIT 1
23%elifidn __OUTPUT_FORMAT__,win32
24%define ABI_IS_32BIT 1
25%else
26%define ABI_IS_32BIT 0
27%endif
28
29%if ABI_IS_32BIT
30%define rax eax
31%define rbx ebx
32%define rcx ecx
33%define rdx edx
34%define rsi esi
35%define rdi edi
36%define rsp esp
37%define rbp ebp
38%define movsxd mov
Jan Kratochvile114f692010-10-04 23:19:33 +020039%macro movq 2
40 %ifidn %1,eax
41 movd %1,%2
42 %elifidn %2,eax
43 movd %1,%2
44 %elifidn %1,ebx
45 movd %1,%2
46 %elifidn %2,ebx
47 movd %1,%2
48 %elifidn %1,ecx
49 movd %1,%2
50 %elifidn %2,ecx
51 movd %1,%2
52 %elifidn %1,edx
53 movd %1,%2
54 %elifidn %2,edx
55 movd %1,%2
56 %elifidn %1,esi
57 movd %1,%2
58 %elifidn %2,esi
59 movd %1,%2
60 %elifidn %1,edi
61 movd %1,%2
62 %elifidn %2,edi
63 movd %1,%2
64 %elifidn %1,esp
65 movd %1,%2
66 %elifidn %2,esp
67 movd %1,%2
68 %elifidn %1,ebp
69 movd %1,%2
70 %elifidn %2,ebp
71 movd %1,%2
72 %else
73 movq %1,%2
74 %endif
75%endmacro
John Koleszar0ea50ce2010-05-18 11:58:33 -040076%endif
77
78
79; sym()
80; Return the proper symbol name for the target ABI.
81;
82; Certain ABIs, notably MS COFF and Darwin MACH-O, require that symbols
83; with C linkage be prefixed with an underscore.
84;
85%ifidn __OUTPUT_FORMAT__,elf32
86%define sym(x) x
87%elifidn __OUTPUT_FORMAT__,elf64
88%define sym(x) x
89%elifidn __OUTPUT_FORMAT__,x64
90%define sym(x) x
91%else
92%define sym(x) _ %+ x
93%endif
94
95; arg()
96; Return the address specification of the given argument
97;
98%if ABI_IS_32BIT
99 %define arg(x) [ebp+8+4*x]
100%else
101 ; 64 bit ABI passes arguments in registers. This is a workaround to get up
102 ; and running quickly. Relies on SHADOW_ARGS_TO_STACK
103 %ifidn __OUTPUT_FORMAT__,x64
104 %define arg(x) [rbp+16+8*x]
105 %else
106 %define arg(x) [rbp-8-8*x]
107 %endif
108%endif
109
110; REG_SZ_BYTES, REG_SZ_BITS
111; Size of a register
112%if ABI_IS_32BIT
113%define REG_SZ_BYTES 4
114%define REG_SZ_BITS 32
115%else
116%define REG_SZ_BYTES 8
117%define REG_SZ_BITS 64
118%endif
119
120
121; ALIGN_STACK <alignment> <register>
122; This macro aligns the stack to the given alignment (in bytes). The stack
123; is left such that the previous value of the stack pointer is the first
124; argument on the stack (ie, the inverse of this macro is 'pop rsp.')
125; This macro uses one temporary register, which is not preserved, and thus
126; must be specified as an argument.
127%macro ALIGN_STACK 2
128 mov %2, rsp
129 and rsp, -%1
Fritz Koenig746439e2010-09-14 15:46:37 -0700130 lea rsp, [rsp - (%1 - REG_SZ_BYTES)]
John Koleszar0ea50ce2010-05-18 11:58:33 -0400131 push %2
132%endmacro
133
134
135;
136; The Microsoft assembler tries to impose a certain amount of type safety in
137; its register usage. YASM doesn't recognize these directives, so we just
138; %define them away to maintain as much compatibility as possible with the
139; original inline assembler we're porting from.
140;
141%idefine PTR
142%idefine XMMWORD
143%idefine MMWORD
144
John Koleszar0ea50ce2010-05-18 11:58:33 -0400145; PIC macros
146;
147%if ABI_IS_32BIT
148 %if CONFIG_PIC=1
149 %ifidn __OUTPUT_FORMAT__,elf32
Ronald S. Bultjec8a23ad2011-06-30 14:04:27 -0700150 %define GET_GOT_SAVE_ARG 1
John Koleszar0ea50ce2010-05-18 11:58:33 -0400151 %define WRT_PLT wrt ..plt
152 %macro GET_GOT 1
153 extern _GLOBAL_OFFSET_TABLE_
154 push %1
155 call %%get_got
Fritz Koenig746439e2010-09-14 15:46:37 -0700156 %%sub_offset:
157 jmp %%exitGG
John Koleszar0ea50ce2010-05-18 11:58:33 -0400158 %%get_got:
Fritz Koenig746439e2010-09-14 15:46:37 -0700159 mov %1, [esp]
160 add %1, _GLOBAL_OFFSET_TABLE_ + $$ - %%sub_offset wrt ..gotpc
161 ret
162 %%exitGG:
John Koleszar0ea50ce2010-05-18 11:58:33 -0400163 %undef GLOBAL
Jan Kratochvil5cdc3a42010-10-04 23:18:58 +0200164 %define GLOBAL(x) x + %1 wrt ..gotoff
John Koleszar0ea50ce2010-05-18 11:58:33 -0400165 %undef RESTORE_GOT
166 %define RESTORE_GOT pop %1
167 %endmacro
168 %elifidn __OUTPUT_FORMAT__,macho32
Ronald S. Bultjec8a23ad2011-06-30 14:04:27 -0700169 %define GET_GOT_SAVE_ARG 1
John Koleszar0ea50ce2010-05-18 11:58:33 -0400170 %macro GET_GOT 1
171 push %1
172 call %%get_got
173 %%get_got:
Rafael Ávila de Espíndola52f6e282011-03-05 15:36:40 -0500174 pop %1
John Koleszar0ea50ce2010-05-18 11:58:33 -0400175 %undef GLOBAL
Rafael Ávila de Espíndola52f6e282011-03-05 15:36:40 -0500176 %define GLOBAL(x) x + %1 - %%get_got
John Koleszar0ea50ce2010-05-18 11:58:33 -0400177 %undef RESTORE_GOT
178 %define RESTORE_GOT pop %1
179 %endmacro
180 %endif
181 %endif
Jan Kratochvil0e8f1082010-07-31 17:12:31 +0200182 %define HIDDEN_DATA(x) x
John Koleszar0ea50ce2010-05-18 11:58:33 -0400183%else
184 %macro GET_GOT 1
185 %endmacro
Jan Kratochvil5cdc3a42010-10-04 23:18:58 +0200186 %define GLOBAL(x) rel x
John Koleszar0ea50ce2010-05-18 11:58:33 -0400187 %ifidn __OUTPUT_FORMAT__,elf64
188 %define WRT_PLT wrt ..plt
Jan Kratochvil0e8f1082010-07-31 17:12:31 +0200189 %define HIDDEN_DATA(x) x:data hidden
Timothy B. Terriberry9f814632010-06-17 19:33:52 -0700190 %else
Jan Kratochvil0e8f1082010-07-31 17:12:31 +0200191 %define HIDDEN_DATA(x) x
John Koleszar0ea50ce2010-05-18 11:58:33 -0400192 %endif
193%endif
194%ifnmacro GET_GOT
195 %macro GET_GOT 1
196 %endmacro
Jan Kratochvil5cdc3a42010-10-04 23:18:58 +0200197 %define GLOBAL(x) x
John Koleszar0ea50ce2010-05-18 11:58:33 -0400198%endif
199%ifndef RESTORE_GOT
200%define RESTORE_GOT
201%endif
202%ifndef WRT_PLT
203%define WRT_PLT
204%endif
205
206%if ABI_IS_32BIT
207 %macro SHADOW_ARGS_TO_STACK 1
208 %endm
209 %define UNSHADOW_ARGS
210%else
211%ifidn __OUTPUT_FORMAT__,x64
212 %macro SHADOW_ARGS_TO_STACK 1 ; argc
213 %if %1 > 0
214 mov arg(0),rcx
215 %endif
216 %if %1 > 1
217 mov arg(1),rdx
218 %endif
219 %if %1 > 2
220 mov arg(2),r8
221 %endif
222 %if %1 > 3
223 mov arg(3),r9
224 %endif
225 %endm
226%else
227 %macro SHADOW_ARGS_TO_STACK 1 ; argc
228 %if %1 > 0
229 push rdi
230 %endif
231 %if %1 > 1
232 push rsi
233 %endif
234 %if %1 > 2
235 push rdx
236 %endif
237 %if %1 > 3
238 push rcx
239 %endif
240 %if %1 > 4
241 push r8
242 %endif
243 %if %1 > 5
244 push r9
245 %endif
246 %if %1 > 6
Scott LaVarnway48c84d12010-06-14 14:07:56 -0400247 %assign i %1-6
248 %assign off 16
249 %rep i
250 mov rax,[rbp+off]
John Koleszar0ea50ce2010-05-18 11:58:33 -0400251 push rax
Scott LaVarnway48c84d12010-06-14 14:07:56 -0400252 %assign off off+8
253 %endrep
John Koleszar0ea50ce2010-05-18 11:58:33 -0400254 %endif
255 %endm
256%endif
257 %define UNSHADOW_ARGS mov rsp, rbp
258%endif
259
Johann4a2b6842011-04-15 10:05:20 -0400260; Win64 ABI requires that XMM6:XMM15 are callee saved
261; SAVE_XMM n, [u]
262; store registers 6-n on the stack
263; if u is specified, use unaligned movs.
264; Win64 ABI requires 16 byte stack alignment, but then pushes an 8 byte return
265; value. Typically we follow this up with 'push rbp' - re-aligning the stack -
266; but in some cases this is not done and unaligned movs must be used.
Makoto Kato63ea8702010-06-11 18:32:28 +0900267%ifidn __OUTPUT_FORMAT__,x64
Johann4a2b6842011-04-15 10:05:20 -0400268%macro SAVE_XMM 1-2 a
269 %if %1 < 6
270 %error Only xmm registers 6-15 must be preserved
271 %else
272 %assign last_xmm %1
273 %define movxmm movdq %+ %2
274 %assign xmm_stack_space ((last_xmm - 5) * 16)
275 sub rsp, xmm_stack_space
276 %assign i 6
277 %rep (last_xmm - 5)
278 movxmm [rsp + ((i - 6) * 16)], xmm %+ i
279 %assign i i+1
280 %endrep
281 %endif
Makoto Kato63ea8702010-06-11 18:32:28 +0900282%endmacro
283%macro RESTORE_XMM 0
Johann4a2b6842011-04-15 10:05:20 -0400284 %ifndef last_xmm
285 %error RESTORE_XMM must be paired with SAVE_XMM n
286 %else
287 %assign i last_xmm
288 %rep (last_xmm - 5)
289 movxmm xmm %+ i, [rsp +((i - 6) * 16)]
290 %assign i i-1
291 %endrep
292 add rsp, xmm_stack_space
293 ; there are a couple functions which return from multiple places.
294 ; otherwise, we could uncomment these:
295 ; %undef last_xmm
296 ; %undef xmm_stack_space
297 ; %undef movxmm
298 %endif
Makoto Kato63ea8702010-06-11 18:32:28 +0900299%endmacro
300%else
Johann4a2b6842011-04-15 10:05:20 -0400301%macro SAVE_XMM 1-2
Makoto Kato63ea8702010-06-11 18:32:28 +0900302%endmacro
303%macro RESTORE_XMM 0
304%endmacro
305%endif
John Koleszar0ea50ce2010-05-18 11:58:33 -0400306
307; Name of the rodata section
308;
309; .rodata seems to be an elf-ism, as it doesn't work on OSX.
310;
311%ifidn __OUTPUT_FORMAT__,macho64
312%define SECTION_RODATA section .text
313%elifidn __OUTPUT_FORMAT__,macho32
314%macro SECTION_RODATA 0
315section .text
John Koleszar0ea50ce2010-05-18 11:58:33 -0400316%endmacro
317%else
318%define SECTION_RODATA section .rodata
319%endif
John Koleszarc3c870e2010-05-27 08:56:34 -0400320
321
322; Tell GNU ld that we don't require an executable stack.
323%ifidn __OUTPUT_FORMAT__,elf32
324section .note.GNU-stack noalloc noexec nowrite progbits
325section .text
326%elifidn __OUTPUT_FORMAT__,elf64
327section .note.GNU-stack noalloc noexec nowrite progbits
328section .text
329%endif
330