diff options
author | Loren Merritt <lorenm@u.washington.edu> | 2013-06-18 21:30:42 +0000 |
---|---|---|
committer | Luca Barbato <lu_zero@gentoo.org> | 2013-06-29 13:23:57 +0200 |
commit | 502ab21af0ca68f76d6112722c46d2f35c004053 (patch) | |
tree | c68ce5c0c787fc552cf572e4aeb3b14f4d80b8a0 /libavutil/lls.h | |
parent | 41578f70cf8aec8e7565fba1ca7e07f3dc46c3d2 (diff) | |
download | ffmpeg-502ab21af0ca68f76d6112722c46d2f35c004053.tar.gz |
x86: lpc: simd av_update_lls
4x-6x faster on sandybridge
Signed-off-by: Luca Barbato <lu_zero@gentoo.org>
Diffstat (limited to 'libavutil/lls.h')
-rw-r--r-- | libavutil/lls.h | 12 |
1 files changed, 9 insertions, 3 deletions
diff --git a/libavutil/lls.h b/libavutil/lls.h
index 81834402f7..27c0d5e3fe 100644
--- a/libavutil/lls.h
+++ b/libavutil/lls.h
@@ -23,9 +23,12 @@
 #ifndef AVUTIL_LLS_H
 #define AVUTIL_LLS_H

+#include "common.h"
+#include "mem.h"
 #include "version.h"

 #define MAX_VARS 32
+#define MAX_VARS_ALIGN FFALIGN(MAX_VARS+1,4)

 //FIXME avoid direct access to LLSModel from outside

@@ -33,26 +36,29 @@
  * Linear least squares model.
  */
 typedef struct LLSModel {
-    double covariance[MAX_VARS + 1][MAX_VARS + 1];
-    double coeff[MAX_VARS][MAX_VARS];
+    DECLARE_ALIGNED(32, double, covariance[MAX_VARS_ALIGN][MAX_VARS_ALIGN]);
+    DECLARE_ALIGNED(32, double, coeff[MAX_VARS][MAX_VARS]);
     double variance[MAX_VARS];
     int indep_count;
     /**
      * Take the outer-product of var[] with itself, and add to the covariance matrix.
      * @param m this context
      * @param var training samples, starting with the value to be predicted
+     *            32-byte aligned, and any padding elements must be initialized
+     *            (i.e not denormal/nan).
      */
     void (*update_lls)(struct LLSModel *m, double *var);
     /**
      * Inner product of var[] and the LPC coefs.
      * @param m this context
-     * @param var training samples, excluding the value to be predicted
+     * @param var training samples, excluding the value to be predicted. unaligned.
      * @param order lpc order
      */
     double (*evaluate_lls)(struct LLSModel *m, double *var, int order);
 } LLSModel;

 void avpriv_init_lls(LLSModel *m, int indep_count);
+void ff_init_lls_x86(LLSModel *m);
 void avpriv_solve_lls(LLSModel *m, double threshold, unsigned short min_order);

 #if FF_API_LLS_PRIVATE