diff options
author | James Almer <jamrial@gmail.com> | 2015-02-15 23:16:25 -0300 |
---|---|---|
committer | James Almer <jamrial@gmail.com> | 2015-02-16 00:41:21 -0300 |
commit | 03adafb318e4746030d84f8b85047ab4958cff0f (patch) | |
tree | 8896642a16920ed756673d8664ec1b1dd1ac44f7 /libavcodec/x86/g722dsp.asm | |
parent | e97a9666ef4511cc34637dc7b064b0a6a4565d0f (diff) | |
download | ffmpeg-03adafb318e4746030d84f8b85047ab4958cff0f.tar.gz |
x86/g722dsp: add ff_g722_apply_qmf_sse2
Reviewed-by: Michael Niedermayer <michaelni@gmx.at>
Signed-off-by: James Almer <jamrial@gmail.com>
Diffstat (limited to 'libavcodec/x86/g722dsp.asm')
-rw-r--r-- | libavcodec/x86/g722dsp.asm | 54 |
1 files changed, 54 insertions, 0 deletions
;******************************************************************************
;* SIMD optimized DSP functions for G722 coding
;*
;* Copyright (c) 2014 James Almer
;*
;* This file is part of FFmpeg.
;*
;* FFmpeg is free software; you can redistribute it and/or
;* modify it under the terms of the GNU Lesser General Public
;* License as published by the Free Software Foundation; either
;* version 2.1 of the License, or (at your option) any later version.
;*
;* FFmpeg is distributed in the hope that it will be useful,
;* but WITHOUT ANY WARRANTY; without even the implied warranty of
;* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
;* Lesser General Public License for more details.
;*
;* You should have received a copy of the GNU Lesser General Public
;* License along with FFmpeg; if not, write to the Free Software
;* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
;******************************************************************************

%include "libavutil/x86/x86util.asm"

SECTION_RODATA

; Coefficient words are stored in the order in which the function below
; interleaves the samples, so that each pmaddwd multiplies matching pairs.
; The word at position k of a table is multiplied by the sample listed at
; position k of the comment above it.

; pairs with samples 0, 8, 1, 9, 2, 10, 3, 11
pw_qmf_c_0_3_8_11:   dw   3, -210,  -11, -805,  -11,  951,   53, 3876
; pairs with samples 4, 12, 5, 13, 6, 14, 7, 15
pw_qmf_c_4_7_12_15:  dw  12, 3876, -156,  951,   32, -805,  362, -210
; pairs with samples 16, 16, 17, 17, 18, 18, 19, 19; the zero in every
; second word makes each duplicated sample count exactly once
pw_qmf_c_16_19:      dw 362,    0,   32,    0, -156,    0,   12,    0
; pairs with samples 20, 20, 21, 21, 22, 22, 23, 23; same zero padding
pw_qmf_c_20_23:      dw  53,    0,  -11,    0,  -11,    0,    3,    0

SECTION_TEXT

;------------------------------------------------------------------------------
; g722_apply_qmf(prev, out)
;
; Reads 24 consecutive 16-bit words from prev (three unaligned vector loads),
; multiplies each by its coefficient as signed words, and stores two 32-bit
; sums to out:
;   out[0] = sum of the products of the odd-indexed samples  (1, 3, ..., 23)
;   out[1] = sum of the products of the even-indexed samples (0, 2, ..., 22)
;
; NOTE(review): the C prototype is not visible in this file; presumably
; (const int16_t *prev, int out[2]) - confirm against the C declaration.
;
; Uses m0-m4. Within every accumulator below, dwords 0 and 2 hold even-sample
; partial sums and dwords 1 and 3 hold odd-sample partial sums.
;------------------------------------------------------------------------------
INIT_XMM sse2
cglobal g722_apply_qmf, 2, 2, 5, prev, out
    ; samples 0..15: interleave the first vector with the second one
    movu         m0, [prevq]
    movu         m1, [prevq+mmsize]
    punpcklwd    m3, m0, m1              ; s0 s8 s1 s9 s2 s10 s3 s11
    punpckhwd    m0, m1                  ; s4 s12 s5 s13 s6 s14 s7 s15
    pmaddwd      m3, [pw_qmf_c_0_3_8_11]
    pmaddwd      m0, [pw_qmf_c_4_7_12_15]
    paddd        m0, m3

    ; samples 16..23: duplicate every word, the tables zero out the copy
    movu         m2, [prevq+mmsize*2]
    punpcklwd    m4, m2, m2              ; s16 s16 s17 s17 s18 s18 s19 s19
    punpckhwd    m2, m2                  ; s20 s20 s21 s21 s22 s22 s23 s23
    pmaddwd      m4, [pw_qmf_c_16_19]
    pmaddwd      m2, [pw_qmf_c_20_23]
    paddd        m2, m4

    ; horizontal reduction: fold dwords 2/3 onto dwords 0/1
    paddd        m0, m2
    pshufd       m2, m0, q0032           ; bring dwords 2 and 3 down to 0 and 1
    paddd        m0, m2                  ; dword 0 = even sum, dword 1 = odd sum

    ; swap the two low dwords so the odd sum is stored first
    pshufd       m0, m0, q0001
    movq     [outq], m0
    RET