diff options
author | Fabrice Bellard <fabrice@bellard.org> | 2003-01-07 17:41:43 +0000 |
---|---|---|
committer | Fabrice Bellard <fabrice@bellard.org> | 2003-01-07 17:41:43 +0000 |
commit | e1958604fdbf67aa8c300d3700c8805db039919d (patch) | |
tree | 1c45ec4ce762c978ec9d0c19d25ddcc2a98ab980 | |
parent | 52b41d7f70821fa594ee8f5941665005c61260c0 (diff) | |
download | ffmpeg-e1958604fdbf67aa8c300d3700c8805db039919d.tar.gz |
added define for builtins use - inverse fix by Romain Dolbeau
Originally committed as revision 1410 to svn://svn.ffmpeg.org/ffmpeg/trunk
-rw-r--r-- | libavcodec/i386/fft_sse.c | 12 |
1 files changed, 12 insertions, 0 deletions
diff --git a/libavcodec/i386/fft_sse.c b/libavcodec/i386/fft_sse.c index 8e8e36b0f7..175cea506c 100644 --- a/libavcodec/i386/fft_sse.c +++ b/libavcodec/i386/fft_sse.c @@ -19,11 +19,16 @@ #include "../dsputil.h" #include <math.h> +#ifdef HAVE_BUILTIN_VECTOR + #include <xmmintrin.h> static const float p1p1p1m1[4] __attribute__((aligned(16))) = { 1.0, 1.0, 1.0, -1.0 }; +static const float p1p1m1p1[4] __attribute__((aligned(16))) = + { 1.0, 1.0, -1.0, 1.0 }; + static const float p1p1m1m1[4] __attribute__((aligned(16))) = { 1.0, 1.0, -1.0, -1.0 }; @@ -54,6 +59,11 @@ void fft_calc_sse(FFTContext *s, FFTComplex *z) r = (__m128 *)&z[0]; c1 = *(__m128 *)p1p1m1m1; c2 = *(__m128 *)p1p1p1m1; + if (s->inverse) + c2 = *(__m128 *)p1p1m1p1; + else + c2 = *(__m128 *)p1p1p1m1; + j = (np >> 2); do { a = r[0]; @@ -126,3 +136,5 @@ void fft_calc_sse(FFTContext *s, FFTComplex *z) nloops = nloops << 1; } while (nblocks != 0); } + +#endif |