diff options
author | Janne Grunau <janne-libav@jannau.net> | 2014-04-28 17:56:43 +0200 |
---|---|---|
committer | Janne Grunau <janne-libav@jannau.net> | 2014-05-15 18:17:02 +0200 |
commit | d3f5b94762fb803c0f3b29f9ad6c5eaa813998ba (patch) | |
tree | 62d2b426d38f8540bdcfb5e126666c89e4cdb279 /libavcodec/aarch64/opus_imdct_init.c | |
parent | 7c5ca546a0747a20c7f7fb5550455c3042699ee9 (diff) | |
download | ffmpeg-d3f5b94762fb803c0f3b29f9ad6c5eaa813998ba.tar.gz |
aarch64: opus NEON iMDCT and FFT
Opus celt decoding 11% faster and the iMDCT over 2.5 times faster on
Apple's A7.
Diffstat (limited to 'libavcodec/aarch64/opus_imdct_init.c')
-rw-r--r-- | libavcodec/aarch64/opus_imdct_init.c | 45 |
1 files changed, 45 insertions, 0 deletions
diff --git a/libavcodec/aarch64/opus_imdct_init.c b/libavcodec/aarch64/opus_imdct_init.c new file mode 100644 index 0000000000..1a776dca00 --- /dev/null +++ b/libavcodec/aarch64/opus_imdct_init.c @@ -0,0 +1,45 @@ +/* + * This file is part of Libav. + * + * Libav is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * Libav is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with Libav; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#include <stddef.h> + +#include "libavutil/cpu.h" +#include "libavutil/aarch64/cpu.h" +#include "libavutil/internal.h" +#include "libavcodec/opus_imdct.h" + +#include "asm-offsets.h" + +AV_CHECK_OFFSET(CeltIMDCTContext, exptab, CELT_EXPTAB); +AV_CHECK_OFFSET(CeltIMDCTContext, fft_n, CELT_FFT_N); +AV_CHECK_OFFSET(CeltIMDCTContext, len2, CELT_LEN2); +AV_CHECK_OFFSET(CeltIMDCTContext, len4, CELT_LEN4); +AV_CHECK_OFFSET(CeltIMDCTContext, tmp, CELT_TMP); +AV_CHECK_OFFSET(CeltIMDCTContext, twiddle_exptab, CELT_TWIDDLE); + +void ff_celt_imdct_half_neon(CeltIMDCTContext *s, float *dst, const float *src, + ptrdiff_t stride, float scale); + +void ff_celt_imdct_init_aarch64(CeltIMDCTContext *s) +{ + int cpu_flags = av_get_cpu_flags(); + + if (have_neon(cpu_flags)) { + s->imdct_half = ff_celt_imdct_half_neon; + } +} |