summaryrefslogtreecommitdiffstats
path: root/libavcodec/vulkan/ffv1_enc_setup.comp
blob: 5f8e6704b0aaaf82d76d538ded9ef3a99e6cbd8e (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
/*
 * FFv1 codec
 *
 * Copyright (c) 2024 Lynne <[email protected]>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

uint8_t state[CONTEXT_SIZE];

void init_slice(inout SliceContext sc, const uint slice_idx)
{
    /* Set coordinates */
    uvec2 img_size = imageSize(src[0]);
    uint sxs = slice_coord(img_size.x, gl_WorkGroupID.x + 0,
                           gl_NumWorkGroups.x, chroma_shift.x);
    uint sxe = slice_coord(img_size.x, gl_WorkGroupID.x + 1,
                           gl_NumWorkGroups.x, chroma_shift.x);
    uint sys = slice_coord(img_size.y, gl_WorkGroupID.y + 0,
                           gl_NumWorkGroups.y, chroma_shift.y);
    uint sye = slice_coord(img_size.y, gl_WorkGroupID.y + 1,
                           gl_NumWorkGroups.y, chroma_shift.y);

    sc.slice_pos = ivec2(sxs, sys);
    sc.slice_dim = ivec2(sxe - sxs, sye - sys);
    sc.slice_coding_mode = int(force_pcm == 1);
    sc.slice_reset_contexts = sc.slice_coding_mode == 1;
    sc.quant_table_idx = u8vec3(context_model);

    if ((rct_search == 0) || (sc.slice_coding_mode == 1))
        sc.slice_rct_coef = ivec2(1, 1);

    rac_init(sc.c,
             OFFBUF(u8buf, out_data, slice_idx * slice_size_max),
             slice_size_max);
}

void put_usymbol(inout RangeCoder c, uint v)
{
    bool is_nil = (v == 0);
    put_rac_direct(c, state[0], is_nil);
    if (is_nil)
        return;

    const int e = findMSB(v);

    for (int i = 0; i < e; i++)
        put_rac_direct(c, state[1 + min(i, 9)], true);
    put_rac_direct(c, state[1 + min(e, 9)], false);

    for (int i = e - 1; i >= 0; i--)
        put_rac_direct(c, state[22 + min(i, 9)], bool(bitfieldExtract(v, i, 1)));
}

void write_slice_header(inout SliceContext sc)
{
    [[unroll]]
    for (int i = 0; i < CONTEXT_SIZE; i++)
        state[i] = uint8_t(128);

    put_usymbol(sc.c, gl_WorkGroupID.x);
    put_usymbol(sc.c, gl_WorkGroupID.y);
    put_usymbol(sc.c, 0);
    put_usymbol(sc.c, 0);

    for (int i = 0; i < codec_planes; i++)
        put_usymbol(sc.c, sc.quant_table_idx[i]);

    put_usymbol(sc.c, pic_mode);
    put_usymbol(sc.c, sar.x);
    put_usymbol(sc.c, sar.y);

    if (version >= 4) {
        put_rac_direct(sc.c, state[0], sc.slice_reset_contexts);
        put_usymbol(sc.c, sc.slice_coding_mode);
        if (sc.slice_coding_mode != 1 && colorspace == 1) {
            put_usymbol(sc.c, sc.slice_rct_coef.y);
            put_usymbol(sc.c, sc.slice_rct_coef.x);
        }
    }
}

void write_frame_header(inout SliceContext sc)
{
    put_rac_equi(sc.c, bool(key_frame));
}

#ifdef GOLOMB
void init_golomb(inout SliceContext sc)
{
    sc.hdr_len = rac_terminate(sc.c);
    init_put_bits(sc.pb,
                  OFFBUF(u8buf, sc.c.bytestream_start, sc.hdr_len),
                  slice_size_max - sc.hdr_len);
}
#endif

void main(void)
{
    const uint slice_idx = gl_WorkGroupID.y*gl_NumWorkGroups.x + gl_WorkGroupID.x;

    init_slice(slice_ctx[slice_idx], slice_idx);

    if (slice_idx == 0)
        write_frame_header(slice_ctx[slice_idx]);

    write_slice_header(slice_ctx[slice_idx]);

#ifdef GOLOMB
    init_golomb(slice_ctx[slice_idx]);
#endif
}