diff options
author | Henrik Gramner <henrik@gramner.com> | 2013-09-11 17:49:22 +0200 |
---|---|---|
committer | Derek Buitenhuis <derek.buitenhuis@gmail.com> | 2013-10-07 06:24:33 -0400 |
commit | 63f0d623100bdb0c6081456127f4b6713e83d3db (patch) | |
tree | 4719a5d1492baba76c224d1d2e81e6a4aad7f655 | |
parent | ad76e6e7e193b98e7335156422d35467816f9ef1 (diff) | |
download | ffmpeg-63f0d623100bdb0c6081456127f4b6713e83d3db.tar.gz |
x86inc: Use SSE instead of SSE2 for copying data
Reduces code size because movaps/movups is one byte
shorter than movdqa/movdqu.
Signed-off-by: Derek Buitenhuis <derek.buitenhuis@gmail.com>
-rw-r--r-- | libavutil/x86/x86inc.asm | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/libavutil/x86/x86inc.asm b/libavutil/x86/x86inc.asm
index b6edfd9373..0c27c60353 100644
--- a/libavutil/x86/x86inc.asm
+++ b/libavutil/x86/x86inc.asm
@@ -436,7 +436,7 @@ DECLARE_REG 14, R15, 120
 %assign %%i xmm_regs_used
 %rep (xmm_regs_used-6)
 %assign %%i %%i-1
- movdqa [rsp + (%%i-6)*16 + stack_size + (~stack_offset&8)], xmm %+ %%i
+ movaps [rsp + (%%i-6)*16 + stack_size + (~stack_offset&8)], xmm %+ %%i
 %endrep
 %endmacro
 
@@ -454,7 +454,7 @@ DECLARE_REG 14, R15, 120
 %assign %%i xmm_regs_used
 %rep (xmm_regs_used-6)
 %assign %%i %%i-1
- movdqa xmm %+ %%i, [%1 + (%%i-6)*16+stack_size+(~stack_offset&8)]
+ movaps xmm %+ %%i, [%1 + (%%i-6)*16+stack_size+(~stack_offset&8)]
 %endrep
 %if stack_size_padded == 0
 add %1, (xmm_regs_used-6)*16+16