diff options
author | James Almer <jamrial@gmail.com> | 2015-01-09 16:51:13 -0300 |
---|---|---|
committer | James Almer <jamrial@gmail.com> | 2015-01-09 20:02:27 -0300 |
commit | da02ee127a21d029763011d99f7eb4e66d3f49b3 (patch) | |
tree | 431a303b20046194c0dbb4cfdaac5459c06c510f /libavfilter/x86/vf_pp7.asm | |
parent | f95cd5a235bae89510cfe4320f2189c9cfbcc457 (diff) | |
download | ffmpeg-da02ee127a21d029763011d99f7eb4e66d3f49b3.tar.gz |
x86/vf_pp7: port dctB_mmx to yasm
Reviewed-by: Michael Niedermayer <michaelni@gmx.at>
Signed-off-by: James Almer <jamrial@gmail.com>
Diffstat (limited to 'libavfilter/x86/vf_pp7.asm')
-rw-r--r-- | libavfilter/x86/vf_pp7.asm | 57 |
1 files changed, 57 insertions, 0 deletions
diff --git a/libavfilter/x86/vf_pp7.asm b/libavfilter/x86/vf_pp7.asm new file mode 100644 index 0000000000..7b3e5cf5e3 --- /dev/null +++ b/libavfilter/x86/vf_pp7.asm @@ -0,0 +1,57 @@ +;***************************************************************************** +;* x86-optimized functions for pp7 filter +;* +;* Copyright (c) 2005 Michael Niedermayer <michaelni@gmx.at> +;* +;* This file is part of FFmpeg. +;* +;* FFmpeg is free software; you can redistribute it and/or modify +;* it under the terms of the GNU General Public License as published by +;* the Free Software Foundation; either version 2 of the License, or +;* (at your option) any later version. +;* +;* FFmpeg is distributed in the hope that it will be useful, +;* but WITHOUT ANY WARRANTY; without even the implied warranty of +;* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +;* GNU General Public License for more details. +;* +;* You should have received a copy of the GNU General Public License along +;* with FFmpeg; if not, write to the Free Software Foundation, Inc., +;* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. +;****************************************************************************** + +%include "libavutil/x86/x86util.asm" + +SECTION .text + +INIT_MMX mmx + +;void ff_pp7_dctB_mmx(int16_t *dst, int16_t *src) +cglobal pp7_dctB, 2, 2, 0, dst, src + movq m0, [srcq] + movq m1, [srcq+mmsize*1] + paddw m0, [srcq+mmsize*6] + paddw m1, [srcq+mmsize*5] + movq m2, [srcq+mmsize*2] + movq m3, [srcq+mmsize*3] + paddw m2, [srcq+mmsize*4] + paddw m3, m3 + movq m4, m3 + psubw m3, m0 + paddw m4, m0 + movq m0, m2 + psubw m2, m1 + paddw m0, m1 + movq m1, m4 + psubw m4, m0 + paddw m1, m0 + movq m0, m3 + psubw m3, m2 + psubw m3, m2 + paddw m2, m0 + paddw m2, m0 + movq [dstq], m1 + movq [dstq+mmsize*2], m4 + movq [dstq+mmsize*1], m2 + movq [dstq+mmsize*3], m3 + RET |