diff options
author | Paul B Mahol <onemda@gmail.com> | 2021-02-09 19:17:27 +0100 |
---|---|---|
committer | Paul B Mahol <onemda@gmail.com> | 2021-02-24 17:14:03 +0100 |
commit | d69f4be1c6c6e305b4f32235bcab35dcc8c9c98b (patch) | |
tree | bd19357ad2c7bae53f68d5fd31c7e0a7547c22dc /libavcodec/cfhdenc.c | |
parent | 767d3f7dcf818a88b7fa9c510b8721f247faee3c (diff) | |
download | ffmpeg-d69f4be1c6c6e305b4f32235bcab35dcc8c9c98b.tar.gz |
avcodec/cfhdenc: refactor DSP code for CFHD encoder
This is needed to implement x86 SIMD.
Diffstat (limited to 'libavcodec/cfhdenc.c')
-rw-r--r-- | libavcodec/cfhdenc.c | 123 |
1 file changed, 33 insertions, 90 deletions
diff --git a/libavcodec/cfhdenc.c b/libavcodec/cfhdenc.c index 7b6b3c92f2..370b1e5063 100644 --- a/libavcodec/cfhdenc.c +++ b/libavcodec/cfhdenc.c @@ -33,6 +33,7 @@ #include "avcodec.h" #include "bytestream.h" #include "cfhd.h" +#include "cfhdencdsp.h" #include "put_bits.h" #include "internal.h" #include "thread.h" @@ -239,6 +240,8 @@ typedef struct CFHDEncContext { Runbook rb[321]; Codebook cb[513]; int16_t *alpha; + + CFHDEncDSPContext dsp; } CFHDEncContext; static av_cold int cfhd_encode_init(AVCodecContext *avctx) @@ -359,6 +362,8 @@ static av_cold int cfhd_encode_init(AVCodecContext *avctx) s->lut[i] = last; } + ff_cfhdencdsp_init(&s->dsp); + if (s->planes != 4) return 0; @@ -369,42 +374,6 @@ static av_cold int cfhd_encode_init(AVCodecContext *avctx) return 0; } -static av_always_inline void filter(int16_t *input, ptrdiff_t in_stride, - int16_t *low, ptrdiff_t low_stride, - int16_t *high, ptrdiff_t high_stride, - int len) -{ - low[(0>>1) * low_stride] = av_clip_int16(input[0*in_stride] + input[1*in_stride]); - high[(0>>1) * high_stride] = av_clip_int16((5 * input[0*in_stride] - 11 * input[1*in_stride] + - 4 * input[2*in_stride] + 4 * input[3*in_stride] - - 1 * input[4*in_stride] - 1 * input[5*in_stride] + 4) >> 3); - - for (int i = 2; i < len - 2; i += 2) { - low[(i>>1) * low_stride] = av_clip_int16(input[i*in_stride] + input[(i+1)*in_stride]); - high[(i>>1) * high_stride] = av_clip_int16(((-input[(i-2)*in_stride] - input[(i-1)*in_stride] + - input[(i+2)*in_stride] + input[(i+3)*in_stride] + 4) >> 3) + - input[(i+0)*in_stride] - input[(i+1)*in_stride]); - } - - low[((len-2)>>1) * low_stride] = av_clip_int16(input[((len-2)+0)*in_stride] + input[((len-2)+1)*in_stride]); - high[((len-2)>>1) * high_stride] = av_clip_int16((11* input[((len-2)+0)*in_stride] - 5 * input[((len-2)+1)*in_stride] - - 4 * input[((len-2)-1)*in_stride] - 4 * input[((len-2)-2)*in_stride] + - 1 * input[((len-2)-3)*in_stride] + 1 * input[((len-2)-4)*in_stride] + 4) >> 3); -} - -static void 
horiz_filter(int16_t *input, int16_t *low, int16_t *high, - int width) -{ - filter(input, 1, low, 1, high, 1, width); -} - -static void vert_filter(int16_t *input, ptrdiff_t in_stride, - int16_t *low, ptrdiff_t low_stride, - int16_t *high, ptrdiff_t high_stride, int len) -{ - filter(input, in_stride, low, low_stride, high, high_stride, len); -} - static void quantize_band(int16_t *input, int width, int a_width, int height, unsigned quantization) { @@ -454,6 +423,7 @@ static int cfhd_encode_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet) { CFHDEncContext *s = avctx->priv_data; + CFHDEncDSPContext *dsp = &s->dsp; PutByteContext *pby = &s->pby; PutBitContext *pb = &s->pb; const Codebook *const cb = s->cb; @@ -480,12 +450,9 @@ static int cfhd_encode_frame(AVCodecContext *avctx, AVPacket *pkt, in_stride = avctx->width; } - for (int i = 0; i < height * 2; i++) { - horiz_filter(input, low, high, width * 2); - input += in_stride; - low += a_width; - high += a_width; - } + dsp->horiz_filter(input, low, high, + in_stride, a_width, a_width, + width * 2, height * 2); input = s->plane[plane].l_h[7]; low = s->plane[plane].subband[7]; @@ -493,23 +460,17 @@ static int cfhd_encode_frame(AVCodecContext *avctx, AVPacket *pkt, high = s->plane[plane].subband[9]; high_stride = s->plane[plane].band[2][0].a_width; - for (int i = 0; i < width; i++) { - vert_filter(input, a_width, low, low_stride, high, high_stride, height * 2); - input++; - low++; - high++; - } + dsp->vert_filter(input, low, high, + a_width, low_stride, high_stride, + width, height * 2); input = s->plane[plane].l_h[6]; low = s->plane[plane].l_h[7]; high = s->plane[plane].subband[8]; - for (int i = 0; i < width; i++) { - vert_filter(input, a_width, low, low_stride, high, high_stride, height * 2); - input++; - low++; - high++; - } + dsp->vert_filter(input, low, high, + a_width, low_stride, high_stride, + width, height * 2); a_width = s->plane[plane].band[1][0].a_width; width = 
s->plane[plane].band[1][0].width; @@ -527,34 +488,25 @@ static int cfhd_encode_frame(AVCodecContext *avctx, AVPacket *pkt, } input = s->plane[plane].l_h[7]; - for (int i = 0; i < height * 2; i++) { - horiz_filter(input, low, high, width * 2); - input += a_width * 2; - low += low_stride; - high += high_stride; - } + dsp->horiz_filter(input, low, high, + a_width * 2, low_stride, high_stride, + width * 2, height * 2); input = s->plane[plane].l_h[4]; low = s->plane[plane].subband[4]; high = s->plane[plane].subband[6]; - for (int i = 0; i < width; i++) { - vert_filter(input, a_width, low, low_stride, high, high_stride, height * 2); - input++; - low++; - high++; - } + dsp->vert_filter(input, low, high, + a_width, low_stride, high_stride, + width, height * 2); input = s->plane[plane].l_h[3]; low = s->plane[plane].l_h[4]; high = s->plane[plane].subband[5]; - for (int i = 0; i < width; i++) { - vert_filter(input, a_width, low, low_stride, high, high_stride, height * 2); - input++; - low++; - high++; - } + dsp->vert_filter(input, low, high, + a_width, low_stride, high_stride, + width, height * 2); a_width = s->plane[plane].band[0][0].a_width; width = s->plane[plane].band[0][0].width; @@ -574,34 +526,25 @@ static int cfhd_encode_frame(AVCodecContext *avctx, AVPacket *pkt, } input = s->plane[plane].l_h[4]; - for (int i = 0; i < height * 2; i++) { - horiz_filter(input, low, high, width * 2); - input += a_width * 2; - low += low_stride; - high += high_stride; - } + dsp->horiz_filter(input, low, high, + a_width * 2, low_stride, high_stride, + width * 2, height * 2); low = s->plane[plane].subband[1]; high = s->plane[plane].subband[3]; input = s->plane[plane].l_h[1]; - for (int i = 0; i < width; i++) { - vert_filter(input, a_width, low, low_stride, high, high_stride, height * 2); - input++; - low++; - high++; - } + dsp->vert_filter(input, low, high, + a_width, low_stride, high_stride, + width, height * 2); low = s->plane[plane].subband[0]; high = s->plane[plane].subband[2]; input = 
s->plane[plane].l_h[0]; - for (int i = 0; i < width; i++) { - vert_filter(input, a_width, low, low_stride, high, high_stride, height * 2); - input++; - low++; - high++; - } + dsp->vert_filter(input, low, high, + a_width, low_stride, high_stride, + width, height * 2); } ret = ff_alloc_packet2(avctx, pkt, 64LL + s->planes * (2LL * avctx->width * avctx->height + 1000LL), 0); |