aboutsummaryrefslogtreecommitdiffstats
path: root/libavcodec/x86/sbrdsp_init.c
diff options
context:
space:
mode:
authorChristophe Gisquet <christophe.gisquet@gmail.com>2012-02-24 22:11:19 +0100
committerDiego Biurrun <diego@biurrun.de>2012-12-07 11:04:26 +0100
commit2aef3d66c9cdf9d9ad3ecec2fb0c6b3020e9d3b0 (patch)
tree4e40bc1d24002be20fa1b0592a5b66e4cb9657d2 /libavcodec/x86/sbrdsp_init.c
parent9a16359c38888af6beab7e688fc55eaa60c835ec (diff)
downloadffmpeg-2aef3d66c9cdf9d9ad3ecec2fb0c6b3020e9d3b0.tar.gz
SBR DSP x86: implement SSE sbr_hf_gen
Start and end index are multiple of 2, therefore guaranteeing aligned access. Also, this allows to generate 4 floats per loop, keeping the alignment all along. Timing: - 32 bits: 326c -> 172c - 64 bits: 323c -> 156c Signed-off-by: Diego Biurrun <diego@biurrun.de>
Diffstat (limited to 'libavcodec/x86/sbrdsp_init.c')
-rw-r--r--libavcodec/x86/sbrdsp_init.c4
1 files changed, 4 insertions, 0 deletions
diff --git a/libavcodec/x86/sbrdsp_init.c b/libavcodec/x86/sbrdsp_init.c
index d272896704..51c4bd4a16 100644
--- a/libavcodec/x86/sbrdsp_init.c
+++ b/libavcodec/x86/sbrdsp_init.c
@@ -27,6 +27,9 @@
float ff_sbr_sum_square_sse(float (*x)[2], int n);
void ff_sbr_hf_g_filt_sse(float (*Y)[2], const float (*X_high)[40][2],
const float *g_filt, int m_max, intptr_t ixh);
+void ff_sbr_hf_gen_sse(float (*X_high)[2], const float (*X_low)[2],
+ const float alpha0[2], const float alpha1[2],
+ float bw, int start, int end);
void ff_sbrdsp_init_x86(SBRDSPContext *s)
{
@@ -35,5 +38,6 @@ void ff_sbrdsp_init_x86(SBRDSPContext *s)
if (EXTERNAL_SSE(mm_flags)) {
s->sum_square = ff_sbr_sum_square_sse;
s->hf_g_filt = ff_sbr_hf_g_filt_sse;
+ s->hf_gen = ff_sbr_hf_gen_sse;
}
}