diff options
author | Michael Niedermayer <michael@niedermayer.cc> | 2019-01-17 22:35:10 +0100 |
---|---|---|
committer | Michael Niedermayer <michael@niedermayer.cc> | 2019-12-02 19:41:47 +0100 |
commit | af857cb62f93f6e8c3469ff667ade90b9ac3665b (patch) | |
tree | ed84b21105ad985b8ae3b17b277653793e077802 | |
parent | d9590afafcc3451dc5a43270b1445b5ec0944f30 (diff) | |
download | ffmpeg-af857cb62f93f6e8c3469ff667ade90b9ac3665b.tar.gz |
avutil/mem: Optimize fill32() by unrolling and using 64bit
Reviewed-by: Marton Balint <cus@passwd.hu>
Signed-off-by: Michael Niedermayer <michael@niedermayer.cc>
(cherry picked from commit 12b1338be376a3e5fb606d9fe41b58dc4a9e62c7)
Signed-off-by: Michael Niedermayer <michael@niedermayer.cc>
-rw-r--r-- | libavutil/mem.c | 12 |
1 files changed, 12 insertions, 0 deletions
diff --git a/libavutil/mem.c b/libavutil/mem.c index 323b18311b..4a9bb963db 100644 --- a/libavutil/mem.c +++ b/libavutil/mem.c @@ -415,6 +415,18 @@ static void fill32(uint8_t *dst, int len) { uint32_t v = AV_RN32(dst - 4); +#if HAVE_FAST_64BIT + uint64_t v2= v + ((uint64_t)v<<32); + while (len >= 32) { + AV_WN64(dst , v2); + AV_WN64(dst+ 8, v2); + AV_WN64(dst+16, v2); + AV_WN64(dst+24, v2); + dst += 32; + len -= 32; + } +#endif + while (len >= 4) { AV_WN32(dst, v); dst += 4; |