diff options
author | James Almer <jamrial@gmail.com> | 2017-05-12 23:31:30 -0300 |
---|---|---|
committer | James Almer <jamrial@gmail.com> | 2017-05-12 23:34:49 -0300 |
commit | 0fbc7a2169af479f8824f44e1b0f0ede5e1d1eaa (patch) | |
tree | fb3f11496e9f7e91a1f48a3eb7a4e61299280d9f | |
parent | 96cbaaa5481baa020eb0cb6faac83e4c5059b212 (diff) | |
download | ffmpeg-0fbc7a2169af479f8824f44e1b0f0ede5e1d1eaa.tar.gz |
x86/float_dsp: remove usage of integer instructions
-rw-r--r-- | libavutil/x86/float_dsp.asm | 14 |
1 files changed, 7 insertions, 7 deletions
diff --git a/libavutil/x86/float_dsp.asm b/libavutil/x86/float_dsp.asm index edade0d55d..06d2d2cfd1 100644 --- a/libavutil/x86/float_dsp.asm +++ b/libavutil/x86/float_dsp.asm @@ -243,8 +243,8 @@ cglobal vector_dmul_scalar, 4,4,3, dst, src, mul, len .loop: mulpd m1, m0, [srcq+lenq ] mulpd m2, m0, [srcq+lenq+mmsize] - mova [dstq+lenq ], m1 - mova [dstq+lenq+mmsize], m2 + movaps [dstq+lenq ], m1 + movaps [dstq+lenq+mmsize], m2 sub lenq, 2*mmsize jge .loop REP_RET @@ -363,14 +363,14 @@ VECTOR_FMUL_ADD %macro VECTOR_FMUL_REVERSE 0 cglobal vector_fmul_reverse, 4,4,2, dst, src0, src1, len %if cpuflag(avx2) - mova m2, [pd_reverse] + movaps m2, [pd_reverse] %endif lea lenq, [lend*4 - 2*mmsize] ALIGN 16 .loop: %if cpuflag(avx2) - vpermd m0, m2, [src1q] - vpermd m1, m2, [src1q+mmsize] + vpermps m0, m2, [src1q] + vpermps m1, m2, [src1q+mmsize] %elif cpuflag(avx) vmovaps xmm0, [src1q + 16] vinsertf128 m0, m0, [src1q], 1 @@ -386,8 +386,8 @@ ALIGN 16 %endif mulps m0, m0, [src0q + lenq + mmsize] mulps m1, m1, [src0q + lenq] - mova [dstq + lenq + mmsize], m0 - mova [dstq + lenq], m1 + movaps [dstq + lenq + mmsize], m0 + movaps [dstq + lenq], m1 add src1q, 2*mmsize sub lenq, 2*mmsize jge .loop |