/* * Apple Pixlet decoder * Copyright (c) 2016 Paul B Mahol * * This file is part of Libav. * * Libav is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * Libav is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with Libav; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #include <stdint.h> #include "libavutil/imgutils.h" #include "libavutil/intmath.h" #include "libavutil/opt.h" #include "avcodec.h" #include "bitstream.h" #include "bytestream.h" #include "internal.h" #include "thread.h" #include "unary.h" #define NB_LEVELS 4 #define PIXLET_MAGIC 0xDEADBEEF #define H 0 #define V 1 typedef struct SubBand { size_t width, height; size_t size; size_t x, y; } SubBand; typedef struct PixletContext { AVClass *class; GetByteContext gb; BitstreamContext bc; int levels; int depth; size_t w, h; int16_t *filter[2]; int16_t *prediction; int64_t scaling[4][2][NB_LEVELS]; SubBand band[4][NB_LEVELS * 3 + 1]; } PixletContext; static av_cold int pixlet_init(AVCodecContext *avctx) { avctx->pix_fmt = AV_PIX_FMT_YUV420P16; avctx->color_range = AVCOL_RANGE_JPEG; return 0; } static av_cold int pixlet_close(AVCodecContext *avctx) { PixletContext *ctx = avctx->priv_data; av_freep(&ctx->filter[0]); av_freep(&ctx->filter[1]); av_freep(&ctx->prediction); return 0; } static int init_decoder(AVCodecContext *avctx) { PixletContext *ctx = avctx->priv_data; int i, plane; ctx->filter[0] = av_malloc_array(ctx->h, sizeof(int16_t)); ctx->filter[1] = av_malloc_array(FFMAX(ctx->h, ctx->w) + 16, sizeof(int16_t)); ctx->prediction = av_malloc_array((ctx->w >> NB_LEVELS), sizeof(int16_t)); if (!ctx->filter[0] || !ctx->filter[1] || !ctx->prediction) return AVERROR(ENOMEM); for (plane = 0; plane < 3; plane++) { unsigned shift = plane > 0; size_t w = ctx->w >> shift; size_t h = ctx->h >> shift; ctx->band[plane][0].width = w >> NB_LEVELS; ctx->band[plane][0].height = h >> NB_LEVELS; ctx->band[plane][0].size = (w >> NB_LEVELS) * (h >> NB_LEVELS); for (i = 0; i < NB_LEVELS * 3; i++) { unsigned scale = ctx->levels - (i / 3); ctx->band[plane][i + 1].width = w >> scale; ctx->band[plane][i + 1].height = h >> scale; ctx->band[plane][i + 1].size = (w >> scale) * (h >> scale); ctx->band[plane][i + 1].x = (w >> scale) * (((i + 1) % 3) != 2); ctx->band[plane][i + 1].y = (h >> scale) * (((i + 1) % 3) != 1); } } return 0; } static int read_low_coeffs(AVCodecContext *avctx, int16_t *dst, size_t size, size_t width, ptrdiff_t stride) { PixletContext *ctx = avctx->priv_data; BitstreamContext *bc = &ctx->bc; unsigned cnt1, nbits, k, j = 0, i = 0; int64_t value, state = 3; int rlen, escape, flag = 0; while (i < size) { nbits = FFMIN(ff_clz((state >> 8) + 3) ^ 0x1F, 14); cnt1 = get_unary(bc, 0, 8); if (cnt1 < 8) { value = bitstream_read(bc, nbits); if (value <= 1) { bitstream_unget(bc, value & 1, 1); value = 1; } escape = value + ((1 << nbits) - 1) * cnt1 - 1; } else { escape = bitstream_read(bc, 16); } value = -((escape + flag) & 1) | 1; dst[j++] = value * ((escape + flag + 1) >> 1); i++; if (j == width) { j = 0; dst += stride; } state = 120 * (escape + flag) + state - (120 * state >> 8); flag = 0; if (state * 4 > 0xFF || i >= size) continue; nbits = ((state + 8) >> 5) + (state ? ff_clz(state) : 32) - 24; escape = av_mod_uintp2(16383, nbits); cnt1 = get_unary(bc, 0, 8); if (cnt1 > 7) { rlen = bitstream_read(bc, 16); } else { value = bitstream_read(bc, nbits); if (value <= 1) { bitstream_unget(bc, value & 1, 1); value = 1; } rlen = value + escape * cnt1 - 1; } if (i + rlen > size) return AVERROR_INVALIDDATA; i += rlen; for (k = 0; k < rlen; k++) { dst[j++] = 0; if (j == width) { j = 0; dst += stride; } } state = 0; flag = rlen < 0xFFFF ? 1 : 0; } bitstream_align(bc); return bitstream_tell(bc) >> 3; } static int read_high_coeffs(AVCodecContext *avctx, uint8_t *src, int16_t *dst, int size, int64_t c, int a, int64_t d, int width, ptrdiff_t stride) { PixletContext *ctx = avctx->priv_data; BitstreamContext *bc = &ctx->bc; unsigned cnt1, shbits, rlen, nbits, length, i = 0, j = 0, k; int ret, escape, pfx, cthulu, yflag, xflag, flag = 0; int64_t state = 3, value, tmp; ret = bitstream_init8(bc, src, bytestream2_get_bytes_left(&ctx->gb)); if (ret < 0) return ret; cthulu = (a >= 0) + (a ^ (a >> 31)) - (a >> 31); if (cthulu != 1) { nbits = 33 - ff_clz(cthulu - 1); if (nbits > 16) return AVERROR_INVALIDDATA; } else { nbits = 1; } length = 25 - nbits; while (i < size) { if (state >> 8 != -3) value = ff_clz((state >> 8) + 3) ^ 0x1F; else value = -1; cnt1 = get_unary(bc, 0, length); if (cnt1 >= length) { cnt1 = bitstream_read(bc, nbits); } else { pfx = 14 + (((value - 14) >> 32) & (value - 14)); cnt1 *= (1 << pfx) - 1; shbits = bitstream_read(bc, pfx); if (shbits <= 1) { bitstream_unget(bc, shbits & 1, 1); shbits = 1; } cnt1 += shbits - 1; } xflag = flag + cnt1; yflag = xflag; if (flag + cnt1 == 0) { value = 0; } else { xflag &= 1u; tmp = c * ((yflag + 1) >> 1) + (c >> 1); value = xflag + (tmp ^ -xflag); } i++; dst[j++] = value; if (j == width) { j = 0; dst += stride; } state += d * yflag - (d * state >> 8); flag = 0; if (state * 4 > 0xFF || i >= size) continue; pfx = ((state + 8) >> 5) + (state ? ff_clz(state) : 32) - 24; escape = av_mod_uintp2(16383, pfx); cnt1 = get_unary(bc, 0, 8); if (cnt1 < 8) { if (pfx < 1 || pfx > 25) return AVERROR_INVALIDDATA; value = bitstream_read(bc, pfx); if (value <= 1) { bitstream_unget(bc, value & 1, 1); value = 1; } rlen = value + escape * cnt1 - 1; } else { if (bitstream_read_bit(bc)) value = bitstream_read(bc, 16); else value = bitstream_read(bc, 8); rlen = value + 8 * escape; } if (rlen > 0xFFFF || i + rlen > size) return AVERROR_INVALIDDATA; i += rlen; for (k = 0; k < rlen; k++) { dst[j++] = 0; if (j == width) { j = 0; dst += stride; } } state = 0; flag = rlen < 0xFFFF ? 1 : 0; } bitstream_align(bc); return bitstream_tell(bc) >> 3; } static int read_highpass(AVCodecContext *avctx, uint8_t *ptr, int plane, AVFrame *frame) { PixletContext *ctx = avctx->priv_data; ptrdiff_t stride = frame->linesize[plane] / 2; int i, ret; for (i = 0; i < ctx->levels * 3; i++) { int32_t a = bytestream2_get_be32(&ctx->gb); int32_t b = bytestream2_get_be32(&ctx->gb); int32_t c = bytestream2_get_be32(&ctx->gb); int32_t d = bytestream2_get_be32(&ctx->gb); int16_t *dest = (int16_t *)frame->data[plane] + ctx->band[plane][i + 1].x + ctx->band[plane][i + 1].y * stride; size_t size = ctx->band[plane][i + 1].size; uint32_t magic = bytestream2_get_be32(&ctx->gb); if (magic != PIXLET_MAGIC) { av_log(avctx, AV_LOG_ERROR, "wrong magic number: 0x%"PRIX32" for plane %d, band %d\n", magic, plane, i); return AVERROR_INVALIDDATA; } ret = read_high_coeffs(avctx, ptr + bytestream2_tell(&ctx->gb), dest, size, c, (b >= FFABS(a)) ? b : a, d, ctx->band[plane][i + 1].width, stride); if (ret < 0) { av_log(avctx, AV_LOG_ERROR, "error in highpass coefficients for plane %d, band %d\n", plane, i); return ret; } bytestream2_skip(&ctx->gb, ret); } return 0; } static void line_add_sat_s16(int16_t *dst, const int16_t *src, size_t len) { int i; for (i = 0; i < len; i++) { int val = dst[i] + src[i]; dst[i] = av_clip_int16(val); } } static void lowpass_prediction(int16_t *dst, int16_t *pred, size_t width, size_t height, ptrdiff_t stride) { int i, j; memset(pred, 0, width * sizeof(*pred)); for (i = 0; i < height; i++) { line_add_sat_s16(pred, dst, width); dst[0] = pred[0]; for (j = 1; j < width; j++) dst[j] = pred[j] + dst[j - 1]; dst += stride; } } static void filterfn(int16_t *dest, int16_t *tmp, size_t size, int64_t scale) { int16_t *low, *high, *ll, *lh, *hl, *hh; int hsize, i, j; int64_t value; hsize = size >> 1; low = tmp + 4; high = &low[hsize + 8]; memcpy(low, dest, size); memcpy(high, dest + hsize, size); ll = &low[hsize]; lh = &low[hsize]; hl = &high[hsize]; hh = hl; for (i = 4, j = 2; i; i--, j++, ll--, hh++, lh++, hl--) { low[i - 5] = low[j - 1]; lh[0] = ll[-1]; high[i - 5] = high[j - 2]; hh[0] = hl[-2]; } for (i = 0; i < hsize; i++) { value = (int64_t) low [i + 1] * -INT64_C(325392907) + (int64_t) low [i + 0] * INT64_C(3687786320) + (int64_t) low [i - 1] * -INT64_C(325392907) + (int64_t) high[i + 0] * INT64_C(1518500249) + (int64_t) high[i - 1] * INT64_C(1518500249); dest[i * 2] = av_clip_int16(((value >> 32) * scale) >> 32); } for (i = 0; i < hsize; i++) { value = (int64_t) low [i + 2] * -INT64_C(65078576) + (int64_t) low [i + 1] * INT64_C(1583578880) + (int64_t) low [i + 0] * INT64_C(1583578880) + (int64_t) low [i - 1] * -INT64_C(65078576) + (int64_t) high[i + 1] * INT64_C(303700064) + (int64_t) high[i + 0] * -INT64_C(3644400640) + (int64_t) high[i - 1] * INT64_C(303700064); dest[i * 2 + 1] = av_clip_int16(((value >> 32) * scale) >> 32); } } static void reconstruction(AVCodecContext *avctx, int16_t *dest, size_t width, size_t height, ptrdiff_t stride, int64_t *scaling_h, int64_t *scaling_v) { PixletContext *ctx = avctx->priv_data; unsigned scaled_width, scaled_height; int16_t *ptr, *tmp; int i, j, k; scaled_width = width >> NB_LEVELS; scaled_height = height >> NB_LEVELS; tmp = ctx->filter[0]; for (i = 0; i < NB_LEVELS; i++) { int64_t scale_v = scaling_v[i]; int64_t scale_h = scaling_h[i]; scaled_width <<= 1; scaled_height <<= 1; ptr = dest; for (j = 0; j < scaled_height; j++) { filterfn(ptr, ctx->filter[1], scaled_width, scale_v); ptr += stride; } for (j = 0; j < scaled_width; j++) { ptr = dest + j; for (k = 0; k < scaled_height; k++) { tmp[k] = *ptr; ptr += stride; } filterfn(tmp, ctx->filter[1], scaled_height, scale_h); ptr = dest + j; for (k = 0; k < scaled_height; k++) { *ptr = tmp[k]; ptr += stride; } } } } static void postprocess_luma(AVFrame *frame, size_t w, size_t h, int depth) { uint16_t *dsty = (uint16_t *)frame->data[0]; int16_t *srcy = (int16_t *)frame->data[0]; ptrdiff_t stridey = frame->linesize[0] / 2; int i, j; for (j = 0; j < h; j++) { for (i = 0; i < w; i++) { if (srcy[i] <= 0) dsty[i] = 0; else if (srcy[i] > ((1 << depth) - 1)) dsty[i] = 65535; else dsty[i] = ((int64_t) srcy[i] * srcy[i] * 65535) / ((1 << depth) - 1) / ((1 << depth) - 1); } dsty += stridey; srcy += stridey; } } static void postprocess_chroma(AVFrame *frame, int w, int h, int depth) { uint16_t *dstu = (uint16_t *)frame->data[1]; uint16_t *dstv = (uint16_t *)frame->data[2]; int16_t *srcu = (int16_t *)frame->data[1]; int16_t *srcv = (int16_t *)frame->data[2]; ptrdiff_t strideu = frame->linesize[1] / 2; ptrdiff_t stridev = frame->linesize[2] / 2; const unsigned add = 1 << (depth - 1); const unsigned shift = 16 - depth; int i, j; for (j = 0; j < h; j++) { for (i = 0; i < w; i++) { dstu[i] = av_clip_uintp2_c(add + srcu[i], depth) << shift; dstv[i] = av_clip_uintp2_c(add + srcv[i], depth) << shift; } dstu += strideu; dstv += stridev; srcu += strideu; srcv += stridev; } } static int decode_plane(AVCodecContext *avctx, int plane, AVPacket *avpkt, AVFrame *frame) { PixletContext *ctx = avctx->priv_data; ptrdiff_t stride = frame->linesize[plane] / 2; unsigned shift = plane > 0; int16_t *dst; int i, ret; for (i = ctx->levels - 1; i >= 0; i--) { int32_t h = sign_extend(bytestream2_get_be32(&ctx->gb), 32); int32_t v = sign_extend(bytestream2_get_be32(&ctx->gb), 32); if (!h || !v) return AVERROR_INVALIDDATA; ctx->scaling[plane][H][i] = (1000000ULL << 32) / h; ctx->scaling[plane][V][i] = (1000000ULL << 32) / v; } bytestream2_skip(&ctx->gb, 4); dst = (int16_t *)frame->data[plane]; dst[0] = sign_extend(bytestream2_get_be16(&ctx->gb), 16); ret = bitstream_init8(&ctx->bc, avpkt->data + bytestream2_tell(&ctx->gb), bytestream2_get_bytes_left(&ctx->gb)); if (ret < 0) return ret; ret = read_low_coeffs(avctx, dst + 1, ctx->band[plane][0].width - 1, ctx->band[plane][0].width - 1, 0); if (ret < 0) { av_log(avctx, AV_LOG_ERROR, "error in lowpass coefficients for plane %d, top row\n", plane); return ret; } ret = read_low_coeffs(avctx, dst + stride, ctx->band[plane][0].height - 1, 1, stride); if (ret < 0) { av_log(avctx, AV_LOG_ERROR, "error in lowpass coefficients for plane %d, left column\n", plane); return ret; } ret = read_low_coeffs(avctx, dst + stride + 1, (ctx->band[plane][0].width - 1) * (ctx->band[plane][0].height - 1), ctx->band[plane][0].width - 1, stride); if (ret < 0) { av_log(avctx, AV_LOG_ERROR, "error in lowpass coefficients for plane %d, rest\n", plane); return ret; } bytestream2_skip(&ctx->gb, ret); if (bytestream2_get_bytes_left(&ctx->gb) <= 0) { av_log(avctx, AV_LOG_ERROR, "no bytes left\n"); return AVERROR_INVALIDDATA; } ret = read_highpass(avctx, avpkt->data, plane, frame); if (ret < 0) return ret; lowpass_prediction(dst, ctx->prediction, ctx->band[plane][0].width, ctx->band[plane][0].height, stride); reconstruction(avctx, (int16_t *)frame->data[plane], ctx->w >> shift, ctx->h >> shift, stride, ctx->scaling[plane][H], ctx->scaling[plane][V]); return 0; } static int pixlet_decode_frame(AVCodecContext *avctx, void *data, int *got_frame, AVPacket *avpkt) { PixletContext *ctx = avctx->priv_data; int i, w, h, width, height, ret, version; AVFrame *p = data; ThreadFrame frame = { .f = data }; uint32_t pktsize; bytestream2_init(&ctx->gb, avpkt->data, avpkt->size); pktsize = bytestream2_get_be32(&ctx->gb); if (pktsize <= 44 || pktsize - 4 > bytestream2_get_bytes_left(&ctx->gb)) { av_log(avctx, AV_LOG_ERROR, "Invalid packet size %"PRIu32".\n", pktsize); return AVERROR_INVALIDDATA; } version = bytestream2_get_le32(&ctx->gb); if (version != 1) avpriv_request_sample(avctx, "Version %d", version); bytestream2_skip(&ctx->gb, 4); if (bytestream2_get_be32(&ctx->gb) != 1) return AVERROR_INVALIDDATA; bytestream2_skip(&ctx->gb, 4); width = bytestream2_get_be32(&ctx->gb); height = bytestream2_get_be32(&ctx->gb); w = FFALIGN(width, 1 << (NB_LEVELS + 1)); h = FFALIGN(height, 1 << (NB_LEVELS + 1)); ctx->levels = bytestream2_get_be32(&ctx->gb); if (ctx->levels != NB_LEVELS) return AVERROR_INVALIDDATA; ctx->depth = bytestream2_get_be32(&ctx->gb); if (ctx->depth < 8 || ctx->depth > 15) { avpriv_request_sample(avctx, "Depth %d", ctx->depth); return AVERROR_INVALIDDATA; } ret = ff_set_dimensions(avctx, w, h); if (ret < 0) return ret; avctx->width = width; avctx->height = height; /* reinit should dimensions change */ if (ctx->w != w || ctx->h != h) { pixlet_close(avctx); ctx->w = w; ctx->h = h; ret = init_decoder(avctx); if (ret < 0) { pixlet_close(avctx); ctx->w = 0; ctx->h = 0; return ret; } } bytestream2_skip(&ctx->gb, 8); ret = ff_thread_get_buffer(avctx, &frame, 0); if (ret < 0) return ret; for (i = 0; i < 3; i++) { ret = decode_plane(avctx, i, avpkt, frame.f); if (ret < 0) return ret; if (avctx->flags & AV_CODEC_FLAG_GRAY) break; } postprocess_luma(frame.f, ctx->w, ctx->h, ctx->depth); postprocess_chroma(frame.f, ctx->w >> 1, ctx->h >> 1, ctx->depth); p->pict_type = AV_PICTURE_TYPE_I; p->color_range = AVCOL_RANGE_JPEG; p->key_frame = 1; *got_frame = 1; return pktsize; } #if HAVE_THREADS static int pixlet_init_thread_copy(AVCodecContext *avctx) { PixletContext *ctx = avctx->priv_data; ctx->filter[0] = NULL; ctx->filter[1] = NULL; ctx->prediction = NULL; ctx->w = 0; ctx->h = 0; return 0; } #endif /* HAVE_THREADS */ AVCodec ff_pixlet_decoder = { .name = "pixlet", .long_name = NULL_IF_CONFIG_SMALL("Apple Pixlet"), .type = AVMEDIA_TYPE_VIDEO, .id = AV_CODEC_ID_PIXLET, .init = pixlet_init, .init_thread_copy = ONLY_IF_THREADS_ENABLED(pixlet_init_thread_copy), .close = pixlet_close, .decode = pixlet_decode_frame, .priv_data_size = sizeof(PixletContext), .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS, .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_INIT_CLEANUP, };