avcodec/scpr: optimize shift loop.

Speeds code up from 50sec to 15sec

Fixes: Timeout
Fixes: 3242/clusterfuzz-testcase-5811951672229888

Found-by: continuous fuzzing process https://github.com/google/oss-fuzz/tree/master/projects/ffmpeg
Reviewed-by: James Almer <jamrial@gmail.com>
Signed-off-by: Michael Niedermayer <michael@niedermayer.cc>
author: Michael Niedermayer <michael@niedermayer.cc> 2017-09-08 23:29:13 +0200
committer: Michael Niedermayer <michael@niedermayer.cc> 2017-09-10 19:08:23 +0200
commit: 981f04b2ae2d6e0355386aaff39840eb5d390a36 (patch)
tree: 032c9b815e133f694c7ed61c7399a6a61eca1599 /libavcodec/scpr.c
parent: cbe181c8e1611aaee2a85ab522e17b1322bdd4de (diff)
download: ffmpeg-981f04b2ae2d6e0355386aaff39840eb5d390a36.tar.gz
1 files changed, 12 insertions, 1 deletions
diff --git a/libavcodec/scpr.c b/libavcodec/scpr.c
index 37fbe7a106..cbe1bc40d9 100644
--- a/libavcodec/scpr.c
+++ b/libavcodec/scpr.c
@@ -826,8 +826,19 @@ static int decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
         if (ret < 0)
             return ret;
 
+        // scale up each sample by 8
         for (y = 0; y < avctx->height; y++) {
-            for (x = 0; x < avctx->width * 4; x++) {
+            // If the image is sufficiently aligned, compute 8 samples at once
+            if (!(((uintptr_t)dst) & 7)) {
+                uint64_t *dst64 = (uint64_t *)dst;
+                int w = avctx->width>>1;
+                for (x = 0; x < w; x++) {
+                    dst64[x] = (dst64[x] << 3) & 0xFCFCFCFCFCFCFCFCULL;
+                }
+                x *= 8;
+            } else
+                x = 0;
+            for (; x < avctx->width * 4; x++) {
                 dst[x] = dst[x] << 3;
             }
             dst += frame->linesize[0];
author	Michael Niedermayer <michael@niedermayer.cc>	2017-09-08 23:29:13 +0200
committer	Michael Niedermayer <michael@niedermayer.cc>	2017-09-10 19:08:23 +0200
commit	981f04b2ae2d6e0355386aaff39840eb5d390a36 (patch)
tree	032c9b815e133f694c7ed61c7399a6a61eca1599 /libavcodec/scpr.c
parent	cbe181c8e1611aaee2a85ab522e17b1322bdd4de (diff)
download	ffmpeg-981f04b2ae2d6e0355386aaff39840eb5d390a36.tar.gz