aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorMartin Vignali <martin.vignali@gmail.com>2019-02-26 10:38:25 +0100
committerMartin Vignali <martin.vignali@gmail.com>2019-03-04 13:03:47 +0100
commit88d0be1c0eea482e160f90d931547803df2df8d6 (patch)
tree30a95ec7373abaf86e0f93596e41ebb18f58130f
parent3278ea67c8f2a7c1aea8fd3114b35983791e6732 (diff)
downloadffmpeg-88d0be1c0eea482e160f90d931547803df2df8d6.tar.gz
avcodec/qtrle: improve 24bpp decoding speed
Benchmark on x86_64: mainly raw data: 20 -> 39 fps; mainly RLE data: 97 -> 119 fps.
-rw-r--r--libavcodec/qtrle.c31
1 files changed, 19 insertions, 12 deletions
diff --git a/libavcodec/qtrle.c b/libavcodec/qtrle.c
index febfea3029..a744d7ba68 100644
--- a/libavcodec/qtrle.c
+++ b/libavcodec/qtrle.c
@@ -297,10 +297,11 @@ static void qtrle_decode_16bpp(QtrleContext *s, int row_ptr, int lines_to_change
static void qtrle_decode_24bpp(QtrleContext *s, int row_ptr, int lines_to_change)
{
- int rle_code;
+ int rle_code, rle_code_half;
int pixel_ptr;
int row_inc = s->frame->linesize[0];
- uint8_t r, g, b;
+ uint8_t b;
+ uint16_t rg;
uint8_t *rgb = s->frame->data[0];
int pixel_limit = s->frame->linesize[0] * s->avctx->height;
@@ -318,25 +319,31 @@ static void qtrle_decode_24bpp(QtrleContext *s, int row_ptr, int lines_to_change
} else if (rle_code < 0) {
/* decode the run length code */
rle_code = -rle_code;
- r = bytestream2_get_byte(&s->g);
- g = bytestream2_get_byte(&s->g);
+ rg = bytestream2_get_ne16(&s->g);
b = bytestream2_get_byte(&s->g);
CHECK_PIXEL_PTR(rle_code * 3);
while (rle_code--) {
- rgb[pixel_ptr++] = r;
- rgb[pixel_ptr++] = g;
- rgb[pixel_ptr++] = b;
+ AV_WN16A(rgb + pixel_ptr, rg);
+ rgb[pixel_ptr + 2] = b;
+ pixel_ptr += 3;
}
} else {
CHECK_PIXEL_PTR(rle_code * 3);
- /* copy pixels directly to output */
- while (rle_code--) {
- rgb[pixel_ptr++] = bytestream2_get_byte(&s->g);
- rgb[pixel_ptr++] = bytestream2_get_byte(&s->g);
- rgb[pixel_ptr++] = bytestream2_get_byte(&s->g);
+ rle_code_half = rle_code / 2;
+
+ while (rle_code_half--) { /* copy 2 raw rgb value at the same time */
+ AV_WN32A(rgb + pixel_ptr, bytestream2_get_ne32(&s->g)); /* rgbr */
+ AV_WN16A(rgb + pixel_ptr + 4, bytestream2_get_ne16(&s->g)); /* rgbr */
+ pixel_ptr += 6;
+ }
+
+ if (rle_code % 2 != 0){ /* not even raw value */
+ AV_WN16A(rgb + pixel_ptr, bytestream2_get_ne16(&s->g));
+ rgb[pixel_ptr + 2] = bytestream2_get_byte(&s->g);
+ pixel_ptr += 3;
}
}
}