Add float_interleave() to FmtConvertContext with x86-optimized versions.

Partially based on patches by clsid2 in ffdshow-tryout. ff_float_interleave6() x86 improvements by Loren Merrit.
author: Justin Ruggles <justin.ruggles@gmail.com> 2011-04-24 17:50:17 -0400
committer: Justin Ruggles <justin.ruggles@gmail.com> 2011-05-18 17:27:05 -0400
commit: 32f8fb8ecf8178b9c9ec8d7152f1fdd8537f7f3a (patch)
tree: 75ece9cd372dafb36670424033068b6edafaceda /libavcodec/x86/fmtconvert_mmx.c
parent: f907ad9b85d5e08e4a024e24734181940cd4fc48 (diff)
download: ffmpeg-32f8fb8ecf8178b9c9ec8d7152f1fdd8537f7f3a.tar.gz
1 files changed, 30 insertions, 0 deletions
diff --git a/libavcodec/x86/fmtconvert_mmx.c b/libavcodec/x86/fmtconvert_mmx.c
index 847bd80fcd..61a4272a69 100644
--- a/libavcodec/x86/fmtconvert_mmx.c
+++ b/libavcodec/x86/fmtconvert_mmx.c
@@ -235,11 +235,40 @@ static void float_to_int16_interleave_3dn2(int16_t *dst, const float **src, long
         float_to_int16_interleave_3dnow(dst, src, len, channels);
 }
 
+void ff_float_interleave2_mmx(float *dst, const float **src, unsigned int len);
+void ff_float_interleave2_sse(float *dst, const float **src, unsigned int len);
+
+void ff_float_interleave6_mmx(float *dst, const float **src, unsigned int len);
+void ff_float_interleave6_sse(float *dst, const float **src, unsigned int len);
+
+static void float_interleave_mmx(float *dst, const float **src,
+                                 unsigned int len, int channels)
+{
+    if (channels == 2) {
+        ff_float_interleave2_mmx(dst, src, len);
+    } else if (channels == 6)
+        ff_float_interleave6_mmx(dst, src, len);
+    else
+        ff_float_interleave_c(dst, src, len, channels);
+}
+
+static void float_interleave_sse(float *dst, const float **src,
+                                 unsigned int len, int channels)
+{
+    if (channels == 2) {
+        ff_float_interleave2_sse(dst, src, len);
+    } else if (channels == 6)
+        ff_float_interleave6_sse(dst, src, len);
+    else
+        ff_float_interleave_c(dst, src, len, channels);
+}
+
 void ff_fmt_convert_init_x86(FmtConvertContext *c, AVCodecContext *avctx)
 {
     int mm_flags = av_get_cpu_flags();
 
     if (mm_flags & AV_CPU_FLAG_MMX) {
+        c->float_interleave = float_interleave_mmx;
 
         if(mm_flags & AV_CPU_FLAG_3DNOW){
             if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
@@ -256,6 +285,7 @@ void ff_fmt_convert_init_x86(FmtConvertContext *c, AVCodecContext *avctx)
             c->int32_to_float_fmul_scalar = int32_to_float_fmul_scalar_sse;
             c->float_to_int16 = float_to_int16_sse;
             c->float_to_int16_interleave = float_to_int16_interleave_sse;
+            c->float_interleave = float_interleave_sse;
         }
         if(mm_flags & AV_CPU_FLAG_SSE2){
             c->int32_to_float_fmul_scalar = int32_to_float_fmul_scalar_sse2;
author	Justin Ruggles <justin.ruggles@gmail.com>	2011-04-24 17:50:17 -0400
committer	Justin Ruggles <justin.ruggles@gmail.com>	2011-05-18 17:27:05 -0400
commit	32f8fb8ecf8178b9c9ec8d7152f1fdd8537f7f3a (patch)
tree	75ece9cd372dafb36670424033068b6edafaceda /libavcodec/x86/fmtconvert_mmx.c
parent	f907ad9b85d5e08e4a024e24734181940cd4fc48 (diff)
download	ffmpeg-32f8fb8ecf8178b9c9ec8d7152f1fdd8537f7f3a.tar.gz