2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved.
4 ; Use of this source code is governed by a BSD-style license
5 ; that can be found in the LICENSE file in the root of the source
6 ; tree. An additional intellectual property rights grant can be found
7 ; in the file PATENTS. All contributing project authors may
8 ; be found in the AUTHORS file in the root of the source tree.
12 %include "vpx_config.asm"
14 ; 32/64 bit compatibility macros
16 ; In general, we make the source use 64 bit syntax, then twiddle with it using
17 ; the preprocessor to get the 32 bit syntax on 32 bit platforms.
;
; ABI_IS_32BIT is set to 1 when __OUTPUT_FORMAT__ is one of elf32, macho32,
; win32 or aout. The last define sets it to 0.
; NOTE(review): the %else / %endif that would separate the final
; "ABI_IS_32BIT 0" fallback from the aout branch are not visible in this
; excerpt -- confirm they are present in the full file.
19 %ifidn __OUTPUT_FORMAT__,elf32
20 %define ABI_IS_32BIT 1
21 %elifidn __OUTPUT_FORMAT__,macho32
22 %define ABI_IS_32BIT 1
23 %elifidn __OUTPUT_FORMAT__,win32
24 %define ABI_IS_32BIT 1
25 %elifidn __OUTPUT_FORMAT__,aout
26 %define ABI_IS_32BIT 1
28 %define ABI_IS_32BIT 0
82 ; Return the proper symbol name for the target ABI.
84 ; Certain ABIs, notably MS COFF and Darwin MACH-O, require that symbols
85 ; with C linkage be prefixed with an underscore.
;
; The choice is keyed on __OUTPUT_FORMAT__; elf32, elf64 and x64 are the
; formats tested explicitly below.
; NOTE(review): the definition selected in each branch, and any fallback
; branch, are not visible in this excerpt -- confirm which formats receive
; the underscore prefix.
87 %ifidn __OUTPUT_FORMAT__,elf32
89 %elifidn __OUTPUT_FORMAT__,elf64
91 %elifidn __OUTPUT_FORMAT__,x64
98 ; Macro for the attribute to hide a global symbol for the target ABI.
99 ; This is only active if CHROMIUM is defined.
101 ; Chromium doesn't like exported global symbols due to symbol clashing with
102 ; plugins among other things.
104 ; Requires Chromium's patched copy of yasm:
105 ; http://src.chromium.org/viewvc/chrome?view=rev&revision=73761
106 ; http://www.tortall.net/projects/yasm/ticket/236
;
; Visible expansions of PRIVATE:
;   elf32, elf64 -> :hidden
;   last define  -> :private_extern
; NOTE(review): the CHROMIUM guard, the body of the x64 branch and the %else
; that presumably precedes the :private_extern definition are not visible in
; this excerpt -- confirm against the full file.
109 %ifidn __OUTPUT_FORMAT__,elf32
110 %define PRIVATE :hidden
111 %elifidn __OUTPUT_FORMAT__,elf64
112 %define PRIVATE :hidden
113 %elifidn __OUTPUT_FORMAT__,x64
116 %define PRIVATE :private_extern
123 ; Return the address specification of the given argument
;
; arg(x) expands to a frame-pointer-relative memory operand for argument
; index x. Three forms are defined:
;   [ebp+8+4*x]   4-byte slots, starting 8 bytes above ebp
;   [rbp+16+8*x]  8-byte slots, starting 16 bytes above rbp (x64 output format)
;   [rbp-8-8*x]   8-byte slots, starting 8 bytes below rbp and growing downward
; NOTE(review): x is substituted without parentheses, so pass a plain index
; (e.g. arg(2)); an expression such as arg(n+1) would not scale as intended.
; NOTE(review): the conditionals that choose the first and last forms are not
; visible in this excerpt -- presumably ABI_IS_32BIT and an %else; confirm.
126 %define arg(x) [ebp+8+4*x]
128 ; 64 bit ABI passes arguments in registers. This is a workaround to get up
129 ; and running quickly. Relies on SHADOW_ARGS_TO_STACK.
130 %ifidn __OUTPUT_FORMAT__,x64
131 %define arg(x) [rbp+16+8*x]
133 %define arg(x) [rbp-8-8*x]
137 ; REG_SZ_BYTES, REG_SZ_BITS
;
; Width of a general-purpose register, in bytes and in bits. Two pairs are
; defined: 4 / 32 and 8 / 64.
; NOTE(review): the conditional that selects between the two pairs is not
; visible in this excerpt -- presumably keyed on ABI_IS_32BIT; confirm.
140 %define REG_SZ_BYTES 4
141 %define REG_SZ_BITS 32
143 %define REG_SZ_BYTES 8
144 %define REG_SZ_BITS 64
148 ; ALIGN_STACK <alignment> <register>
149 ; This macro aligns the stack to the given alignment (in bytes). The stack
150 ; is left such that the previous value of the stack pointer is the first
151 ; argument on the stack (i.e., the inverse of this macro is 'pop rsp').
152 ; This macro uses one temporary register, which is not preserved, and thus
153 ; must be specified as an argument.
;
; The visible instruction lowers rsp by (alignment - REG_SZ_BYTES) bytes, where
; %1 is the alignment argument; lea does not modify the flags.
; NOTE(review): the %macro / %endmacro lines and the remaining instructions of
; the macro body are not visible in this excerpt.
157 lea rsp, [rsp - (%1 - REG_SZ_BYTES)]
163 ; The Microsoft assembler tries to impose a certain amount of type safety in
164 ; its register usage. YASM doesn't recognize these directives, so we just
165 ; %define them away to maintain as much compatibility as possible with the
166 ; original inline assembler we're porting from.
; Helpers for addressing global data and calling through the PLT.
; NOTE(review): the uses of %1 and %%-prefixed local labels below indicate that
; several of these lines sit inside multi-line macros whose %macro / %endmacro
; lines (and the matching %else / %endif lines) are not visible in this
; excerpt; the notes below describe only what each visible line expands to.
;
; elf32: GET_GOT_SAVE_ARG is 1 and WRT_PLT expands to "wrt ..plt".
176 %ifidn __OUTPUT_FORMAT__,elf32
177 %define GET_GOT_SAVE_ARG 1
178 %define WRT_PLT wrt ..plt
180 extern _GLOBAL_OFFSET_TABLE_
; Add the ..gotpc-relative offset of _GLOBAL_OFFSET_TABLE_ to register %1.
187 add %1, _GLOBAL_OFFSET_TABLE_ + $$ - %%sub_offset wrt ..gotpc
; GLOBAL(x): x addressed as an offset from register %1 (wrt ..gotoff).
191 %define GLOBAL(x) x + %1 wrt ..gotoff
; RESTORE_GOT pops register %1.
193 %define RESTORE_GOT pop %1
; macho32: GLOBAL(x) is x plus register %1 minus the local label %%get_got.
195 %elifidn __OUTPUT_FORMAT__,macho32
196 %define GET_GOT_SAVE_ARG 1
203 %define GLOBAL(x) x + %1 - %%get_got
205 %define RESTORE_GOT pop %1
; HIDDEN_DATA(x): x:private_extern on macho32, plain x in the other visible
; definitions in this group.
211 %ifidn __OUTPUT_FORMAT__,macho32
212 %define HIDDEN_DATA(x) x:private_extern
214 %define HIDDEN_DATA(x) x
217 %define HIDDEN_DATA(x) x
; Here GLOBAL(x) is simply "rel x"; on elf64 WRT_PLT is "wrt ..plt" and
; HIDDEN_DATA(x) is "x:data hidden", otherwise HIDDEN_DATA(x) is plain x.
; NOTE(review): presumably this is the 64-bit branch -- confirm against the
; enclosing conditional, which is not visible here.
222 %define GLOBAL(x) rel x
223 %ifidn __OUTPUT_FORMAT__,elf64
224 %define WRT_PLT wrt ..plt
225 %define HIDDEN_DATA(x) x:data hidden
227 %define HIDDEN_DATA(x) x
; SHADOW_ARGS_TO_STACK <argc> / UNSHADOW_ARGS
; Three variants of SHADOW_ARGS_TO_STACK are declared below, each taking one
; parameter (argc, per the trailing comments). UNSHADOW_ARGS is defined empty
; alongside the first variant and as "mov rsp, rbp" in the last visible define.
; NOTE(review): the macro bodies, their %endmacro lines and the conditionals
; that select a variant are not visible in this excerpt -- presumably the first
; variant is the 32-bit one and the other two are the x64 and non-x64 64-bit
; ones; confirm against the full file.
243 %macro SHADOW_ARGS_TO_STACK 1
245 %define UNSHADOW_ARGS
247 %ifidn __OUTPUT_FORMAT__,x64
248 %macro SHADOW_ARGS_TO_STACK 1 ; argc
263 %macro SHADOW_ARGS_TO_STACK 1 ; argc
293 %define UNSHADOW_ARGS mov rsp, rbp
296 ; Win64 ABI requires that XMM6:XMM15 are callee saved
298 ; store registers 6-n on the stack
299 ; if u is specified, use unaligned movs.
300 ; Win64 ABI requires 16 byte stack alignment, but then pushes an 8 byte return
301 ; address. Typically we follow this up with 'push rbp' - re-aligning the stack -
302 ; but in some cases this is not done and unaligned movs must be used.
303 %ifidn __OUTPUT_FORMAT__,x64
; SAVE_XMM takes one or two parameters; the second defaults to "a".
304 %macro SAVE_XMM 1-2 a
306 %error Only xmm registers 6-15 must be preserved
; movxmm becomes movdqa or movdqu, depending on the second parameter.
309 %define movxmm movdq %+ %2
; One 16-byte slot per register from xmm6 through xmm<last_xmm>.
; NOTE(review): the definition of last_xmm is not visible in this excerpt --
; presumably it is the first macro parameter; confirm.
310 %assign xmm_stack_space ((last_xmm - 5) * 16)
311 sub rsp, xmm_stack_space
; Store xmm<i> in slot (i - 6).
; NOTE(review): the loop that steps i is not visible in this excerpt.
314 movxmm [rsp + ((i - 6) * 16)], xmm %+ i
321 %error RESTORE_XMM must be paired with SAVE_XMM n
; Reload xmm<i> from slot (i - 6), then release the save area.
325 movxmm xmm %+ i, [rsp +((i - 6) * 16)]
328 add rsp, xmm_stack_space
329 ; there are a couple functions which return from multiple places.
330 ; otherwise, we could uncomment these:
332 ; %undef xmm_stack_space
343 ; Name of the rodata section
345 ; .rodata seems to be an elf-ism, as it doesn't work on OSX.
;
; Visible mappings of SECTION_RODATA by output format:
;   macho64     -> section .text
;   macho32     -> multi-line macro (body not visible in this excerpt)
;   aout        -> section .data
;   last define -> section .rodata
; NOTE(review): the %else before the final define and the closing %endif are
; not visible in this excerpt -- confirm against the full file.
347 %ifidn __OUTPUT_FORMAT__,macho64
348 %define SECTION_RODATA section .text
349 %elifidn __OUTPUT_FORMAT__,macho32
350 %macro SECTION_RODATA 0
353 %elifidn __OUTPUT_FORMAT__,aout
354 %define SECTION_RODATA section .data
356 %define SECTION_RODATA section .rodata
360 ; Tell GNU ld that we don't require an executable stack.
; The same .note.GNU-stack section (noalloc, noexec, nowrite, progbits) is
; emitted for both elf32 and elf64 output.
; NOTE(review): the closing %endif is not visible in this excerpt.
361 %ifidn __OUTPUT_FORMAT__,elf32
362 section .note.GNU-stack noalloc noexec nowrite progbits
364 %elifidn __OUTPUT_FORMAT__,elf64
365 section .note.GNU-stack noalloc noexec nowrite progbits