diff options
author | Måns Rullgård <mans@mansr.com> | 2010-02-09 16:13:41 +0000 |
---|---|---|
committer | Måns Rullgård <mans@mansr.com> | 2010-02-09 16:13:41 +0000 |
commit | 3132614305a4591c75ac20e4f13d1398e17375b4 (patch) | |
tree | 548e6c5177c38c9c59e911f4994851e4168afec6 | |
parent | f73a626ae4c374546226091c0a74a9053181af1d (diff) | |
download | ffmpeg-3132614305a4591c75ac20e4f13d1398e17375b4.tar.gz |
ARMv6 optimised diff_pixels
Originally committed as revision 21702 to svn://svn.ffmpeg.org/ffmpeg/trunk
-rw-r--r-- | libavcodec/arm/dsputil_armv6.S | 33 | ||||
-rw-r--r-- | libavcodec/arm/dsputil_init_armv6.c | 3 |
2 files changed, 36 insertions, 0 deletions
diff --git a/libavcodec/arm/dsputil_armv6.S b/libavcodec/arm/dsputil_armv6.S
index 4c7f44032d..800d8f291c 100644
--- a/libavcodec/arm/dsputil_armv6.S
+++ b/libavcodec/arm/dsputil_armv6.S
@@ -309,6 +309,39 @@ function ff_get_pixels_armv6, export=1
         pop             {r4-r8, pc}
 .endfunc
 
+function ff_diff_pixels_armv6, export=1
+        pld             [r1, r3]
+        pld             [r2, r3]
+        push            {r4-r9, lr}
+        mov             lr, #8
+1:
+        ldrd            r4, r5, [r1], r3
+        ldrd            r6, r7, [r2], r3
+        uxtb16          r8, r4
+        uxtb16          r4, r4, ror #8
+        uxtb16          r9, r6
+        uxtb16          r6, r6, ror #8
+        pld             [r1, r3]
+        ssub16          r9, r8, r9
+        ssub16          r6, r4, r6
+        uxtb16          r8, r5
+        uxtb16          r5, r5, ror #8
+        pld             [r2, r3]
+        pkhbt           r4, r9, r6, lsl #16
+        pkhtb           r6, r6, r9, asr #16
+        uxtb16          r9, r7
+        uxtb16          r7, r7, ror #8
+        ssub16          r9, r8, r9
+        ssub16          r5, r5, r7
+        subs            lr, lr, #1
+        pkhbt           r8, r9, r5, lsl #16
+        pkhtb           r9, r5, r9, asr #16
+        stm             r0!, {r4,r6,r8,r9}
+        bgt             1b
+
+        pop             {r4-r9, pc}
+.endfunc
+
 function ff_pix_abs16_armv6, export=1
         ldr             r0, [sp]
         push            {r4-r9, lr}
diff --git a/libavcodec/arm/dsputil_init_armv6.c b/libavcodec/arm/dsputil_init_armv6.c
index 1e599430f7..43eab46f0a 100644
--- a/libavcodec/arm/dsputil_init_armv6.c
+++ b/libavcodec/arm/dsputil_init_armv6.c
@@ -51,6 +51,8 @@ void ff_add_pixels_clamped_armv6(const DCTELEM *block,
                                  int line_size);
 
 void ff_get_pixels_armv6(DCTELEM *block, const uint8_t *pixels, int stride);
+void ff_diff_pixels_armv6(DCTELEM *block, const uint8_t *s1,
+                          const uint8_t *s2, int stride);
 
 int ff_pix_abs16_armv6(void *s, uint8_t *blk1, uint8_t *blk2,
                        int line_size, int h);
@@ -95,6 +97,7 @@ void av_cold ff_dsputil_init_armv6(DSPContext* c, AVCodecContext *avctx)
     c->add_pixels_clamped = ff_add_pixels_clamped_armv6;
 
     c->get_pixels = ff_get_pixels_armv6;
+    c->diff_pixels = ff_diff_pixels_armv6;
 
     c->pix_abs[0][0] = ff_pix_abs16_armv6;
     c->pix_abs[0][1] = ff_pix_abs16_x2_armv6;