1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
|
/*
* VVC CTU(Coding Tree Unit) parser
*
* Copyright (C) 2022 Nuo Mi
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#ifndef AVCODEC_VVC_CTU_H
#define AVCODEC_VVC_CTU_H
#include "libavcodec/cabac.h"
#include "libavutil/mem_internal.h"
#include "dec.h"
#define MAX_CTU_SIZE 128
#define MAX_CU_SIZE MAX_CTU_SIZE
#define MIN_CU_SIZE 4
#define MIN_CU_LOG2 2
#define MAX_CU_DEPTH 7
#define MAX_PARTS_IN_CTU ((MAX_CTU_SIZE >> MIN_CU_LOG2) * (MAX_CTU_SIZE >> MIN_CU_LOG2))
#define MIN_PU_SIZE 4
#define MAX_TB_SIZE 64
#define MIN_TU_SIZE 4
#define MAX_TUS_IN_CU 64
#define MAX_QP 63
#define MAX_PB_SIZE 128
#define EDGE_EMU_BUFFER_STRIDE (MAX_PB_SIZE + 32)
#define CHROMA_EXTRA_BEFORE 1
#define CHROMA_EXTRA_AFTER 2
#define CHROMA_EXTRA 3
#define LUMA_EXTRA_BEFORE 3
#define LUMA_EXTRA_AFTER 4
#define LUMA_EXTRA 7
#define BILINEAR_EXTRA_BEFORE 0
#define BILINEAR_EXTRA_AFTER 1
#define BILINEAR_EXTRA 1
#define SCALED_INT(pos) ((pos) >> 10)
#define MAX_CONTROL_POINTS 3
#define AFFINE_MIN_BLOCK_SIZE 4
#define MRG_MAX_NUM_CANDS 6
#define MAX_NUM_HMVP_CANDS 5
#define SAO_PADDING_SIZE 1
#define ALF_PADDING_SIZE 8
#define ALF_BLOCK_SIZE 4
#define ALF_BORDER_LUMA 3
#define ALF_BORDER_CHROMA 2
#define ALF_VB_POS_ABOVE_LUMA 4
#define ALF_VB_POS_ABOVE_CHROMA 2
#define ALF_GRADIENT_STEP 2
#define ALF_GRADIENT_BORDER 2
#define ALF_GRADIENT_SIZE ((MAX_CU_SIZE + ALF_GRADIENT_BORDER * 2) / ALF_GRADIENT_STEP)
#define ALF_NUM_DIR 4
/**
* Value of the luma sample at position (x, y) in the 2D array tab.
*/
#define SAMPLE(tab, x, y) ((tab)[(y) * s->pps->width + (x)])
#define SAMPLE_CTB(tab, x, y) ((tab)[(y) * min_cb_width + (x)])
#define CTB(tab, x, y) ((tab)[(y) * fc->ps.pps->ctb_width + (x)])
enum SAOType {
SAO_NOT_APPLIED = 0,
SAO_BAND,
SAO_EDGE,
};
enum SAOEOClass {
SAO_EO_HORIZ = 0,
SAO_EO_VERT,
SAO_EO_135D,
SAO_EO_45D,
};
typedef struct NeighbourAvailable {
int cand_left;
int cand_up;
int cand_up_left;
int cand_up_right;
int cand_up_right_sap;
} NeighbourAvailable;
enum IspType{
ISP_NO_SPLIT,
ISP_HOR_SPLIT,
ISP_VER_SPLIT,
};
typedef enum VVCSplitMode {
SPLIT_NONE,
SPLIT_TT_HOR,
SPLIT_BT_HOR,
SPLIT_TT_VER,
SPLIT_BT_VER,
SPLIT_QT,
} VVCSplitMode;
typedef enum MtsIdx {
MTS_DCT2_DCT2,
MTS_DST7_DST7,
MTS_DST7_DCT8,
MTS_DCT8_DST7,
MTS_DCT8_DCT8,
} MtsIdx;
typedef struct TransformBlock {
uint8_t has_coeffs;
uint8_t c_idx;
uint8_t ts; ///< transform_skip_flag
int x0;
int y0;
int tb_width;
int tb_height;
int log2_tb_width;
int log2_tb_height;
int max_scan_x;
int max_scan_y;
int min_scan_x;
int min_scan_y;
int qp;
int rect_non_ts_flag;
int bd_shift;
int bd_offset;
int *coeffs;
} TransformBlock;
typedef enum VVCTreeType {
SINGLE_TREE,
DUAL_TREE_LUMA,
DUAL_TREE_CHROMA,
} VVCTreeType;
typedef struct TransformUnit {
int x0;
int y0;
int width;
int height;
uint8_t joint_cbcr_residual_flag; ///< tu_joint_cbcr_residual_flag
uint8_t coded_flag[VVC_MAX_SAMPLE_ARRAYS]; ///< tu_y_coded_flag, tu_cb_coded_flag, tu_cr_coded_flag
uint8_t nb_tbs;
TransformBlock tbs[VVC_MAX_SAMPLE_ARRAYS];
struct TransformUnit *next; ///< RefStruct reference
} TransformUnit;
typedef enum PredMode {
MODE_INTER,
MODE_INTRA,
MODE_SKIP,
MODE_PLT,
MODE_IBC,
} PredMode;
typedef struct Mv {
int x; ///< horizontal component of motion vector
int y; ///< vertical component of motion vector
} Mv;
typedef struct MvField {
DECLARE_ALIGNED(8, Mv, mv)[2]; ///< mvL0, vvL1
int8_t ref_idx[2]; ///< refIdxL0, refIdxL1
uint8_t hpel_if_idx; ///< hpelIfIdx
uint8_t bcw_idx; ///< bcwIdx
uint8_t pred_flag;
uint8_t ciip_flag; ///< ciip_flag
} MvField;
typedef struct DMVRInfo {
DECLARE_ALIGNED(8, Mv, mv)[2]; ///< mvL0, vvL1
uint8_t dmvr_enabled;
} DMVRInfo;
typedef enum MotionModelIdc {
MOTION_TRANSLATION,
MOTION_4_PARAMS_AFFINE,
MOTION_6_PARAMS_AFFINE,
} MotionModelIdc;
typedef enum PredFlag {
PF_INTRA = 0x0,
PF_L0 = 0x1,
PF_L1 = 0x2,
PF_BI = 0x3,
PF_IBC = PF_L0 | 0x4,
} PredFlag;
typedef enum IntraPredMode {
INTRA_INVALID = -1,
INTRA_PLANAR = 0,
INTRA_DC,
INTRA_HORZ = 18,
INTRA_DIAG = 34,
INTRA_VERT = 50,
INTRA_VDIAG = 66,
INTRA_LT_CCLM = 81,
INTRA_L_CCLM,
INTRA_T_CCLM
} IntraPredMode;
typedef struct MotionInfo {
MotionModelIdc motion_model_idc; ///< MotionModelIdc
int8_t ref_idx[2]; ///< refIdxL0, refIdxL1
uint8_t hpel_if_idx; ///< hpelIfIdx
uint8_t bcw_idx; ///< bcwIdx
PredFlag pred_flag;
Mv mv[2][MAX_CONTROL_POINTS];
int num_sb_x, num_sb_y;
} MotionInfo;
typedef struct PredictionUnit {
uint8_t general_merge_flag;
uint8_t mmvd_merge_flag;
//InterPredIdc inter_pred_idc;
uint8_t inter_affine_flag;
//subblock predict
uint8_t merge_subblock_flag;
uint8_t merge_gpm_flag;
uint8_t gpm_partition_idx;
MvField gpm_mv[2];
int sym_mvd_flag;
MotionInfo mi;
// for regular prediction only
uint8_t dmvr_flag;
uint8_t bdof_flag;
int16_t diff_mv_x[2][AFFINE_MIN_BLOCK_SIZE * AFFINE_MIN_BLOCK_SIZE]; ///< diffMvLX
int16_t diff_mv_y[2][AFFINE_MIN_BLOCK_SIZE * AFFINE_MIN_BLOCK_SIZE]; ///< diffMvLX
int cb_prof_flag[2];
} PredictionUnit;
typedef struct CodingUnit {
VVCTreeType tree_type;
int x0;
int y0;
int cb_width;
int cb_height;
int ch_type;
int cqt_depth;
uint8_t coded_flag;
uint8_t sbt_flag;
uint8_t sbt_horizontal_flag;
uint8_t sbt_pos_flag;
int lfnst_idx;
MtsIdx mts_idx;
uint8_t act_enabled_flag;
uint8_t intra_luma_ref_idx; ///< IntraLumaRefLineIdx[][]
uint8_t intra_mip_flag; ///< intra_mip_flag
uint8_t skip_flag; ///< cu_skip_flag;
//inter
uint8_t ciip_flag;
// Inferred parameters
enum IspType isp_split_type; ///< IntraSubPartitionsSplitType
enum PredMode pred_mode; ///< PredMode
int num_intra_subpartitions;
IntraPredMode intra_pred_mode_y; ///< IntraPredModeY
IntraPredMode intra_pred_mode_c; ///< IntraPredModeC
int mip_chroma_direct_flag; ///< MipChromaDirectFlag
int bdpcm_flag[VVC_MAX_SAMPLE_ARRAYS]; ///< BdpcmFlag
int apply_lfnst_flag[VVC_MAX_SAMPLE_ARRAYS]; ///< ApplyLfnstFlag[]
struct {
TransformUnit *head; ///< RefStruct reference
TransformUnit *tail; ///< RefStruct reference
} tus;
int8_t qp[4]; ///< QpY, Qp′Cb, Qp′Cr, Qp′CbCr
PredictionUnit pu;
struct CodingUnit *next; ///< RefStruct reference
} CodingUnit;
typedef struct CTU {
CodingUnit *cus;
int max_y[2][VVC_MAX_REF_ENTRIES];
int max_y_idx[2];
int has_dmvr;
} CTU;
typedef struct ReconstructedArea {
int x;
int y;
int w;
int h;
} ReconstructedArea;
typedef struct VVCCabacState {
uint16_t state[2];
uint8_t shift[2];
} VVCCabacState;
// VVC_CONTEXTS matched with SYNTAX_ELEMENT_LAST, it's checked by cabac_init_state.
#define VVC_CONTEXTS 378
typedef struct EntryPoint {
int8_t qp_y; ///< QpY
int stat_coeff[VVC_MAX_SAMPLE_ARRAYS]; ///< StatCoeff
VVCCabacState cabac_state[VVC_CONTEXTS];
CABACContext cc;
int ctu_start;
int ctu_end;
uint8_t is_first_qg; // first quantization group
MvField hmvp[MAX_NUM_HMVP_CANDS]; ///< HmvpCandList
int num_hmvp; ///< NumHmvpCand
MvField hmvp_ibc[MAX_NUM_HMVP_CANDS]; ///< HmvpIbcCandList
int num_hmvp_ibc; ///< NumHmvpIbcCand
} EntryPoint;
typedef struct VVCLocalContext {
uint8_t ctb_left_flag;
uint8_t ctb_up_flag;
uint8_t ctb_up_right_flag;
uint8_t ctb_up_left_flag;
int end_of_tiles_x;
int end_of_tiles_y;
/* +7 is for subpixel interpolation, *2 for high bit depths */
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer)[(MAX_PB_SIZE + 7) * EDGE_EMU_BUFFER_STRIDE * 2];
/* The extended size between the new edge emu buffer is abused by SAO */
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer2)[(MAX_PB_SIZE + 7) * EDGE_EMU_BUFFER_STRIDE * 2];
DECLARE_ALIGNED(32, int16_t, tmp)[MAX_PB_SIZE * MAX_PB_SIZE];
DECLARE_ALIGNED(32, int16_t, tmp1)[MAX_PB_SIZE * MAX_PB_SIZE];
DECLARE_ALIGNED(32, int16_t, tmp2)[MAX_PB_SIZE * MAX_PB_SIZE];
DECLARE_ALIGNED(32, uint8_t, ciip_tmp)[MAX_PB_SIZE * MAX_PB_SIZE * 2];
DECLARE_ALIGNED(32, uint8_t, sao_buffer)[(MAX_CTU_SIZE + 2 * SAO_PADDING_SIZE) * EDGE_EMU_BUFFER_STRIDE * 2];
DECLARE_ALIGNED(32, uint8_t, alf_buffer_luma)[(MAX_CTU_SIZE + 2 * ALF_PADDING_SIZE) * EDGE_EMU_BUFFER_STRIDE * 2];
DECLARE_ALIGNED(32, uint8_t, alf_buffer_chroma)[(MAX_CTU_SIZE + 2 * ALF_PADDING_SIZE) * EDGE_EMU_BUFFER_STRIDE * 2];
DECLARE_ALIGNED(32, int32_t, alf_gradient_tmp)[ALF_GRADIENT_SIZE * ALF_GRADIENT_SIZE * ALF_NUM_DIR];
struct {
int sbt_num_fourths_tb0; ///< SbtNumFourthsTb0
uint8_t is_cu_qp_delta_coded; ///< IsCuQpDeltaCoded
int cu_qg_top_left_x; ///< CuQgTopLeftX
int cu_qg_top_left_y; ///< CuQgTopLeftY
int is_cu_chroma_qp_offset_coded; ///< IsCuChromaQpOffsetCoded
int chroma_qp_offset[3]; ///< CuQpOffsetCb, CuQpOffsetCr, CuQpOffsetCbCr
int infer_tu_cbf_luma; ///< InferTuCbfLuma
int prev_tu_cbf_y; ///< prevTuCbfY;
int lfnst_dc_only; ///< LfnstDcOnly
int lfnst_zero_out_sig_coeff_flag; ///< LfnstZeroOutSigCoeffFlag
int mts_dc_only; ///< MtsDcOnly
int mts_zero_out_sig_coeff_flag; ///< MtsZeroOutSigCoeffFlag;
} parse;
struct {
// lmcs cache, for recon only
int chroma_scale;
int x_vpdu;
int y_vpdu;
} lmcs;
CodingUnit *cu;
ReconstructedArea ras[2][MAX_PARTS_IN_CTU];
int num_ras[2];
NeighbourAvailable na;
#define BOUNDARY_LEFT_SLICE (1 << 0)
#define BOUNDARY_LEFT_TILE (1 << 1)
#define BOUNDARY_LEFT_SUBPIC (1 << 2)
#define BOUNDARY_UPPER_SLICE (1 << 3)
#define BOUNDARY_UPPER_TILE (1 << 4)
#define BOUNDARY_UPPER_SUBPIC (1 << 5)
/* properties of the boundary of the current CTB for the purposes
* of the deblocking filter */
int boundary_flags;
SliceContext *sc;
VVCFrameContext *fc;
EntryPoint *ep;
int *coeffs;
} VVCLocalContext;
typedef struct VVCAllowedSplit {
int qt;
int btv;
int bth;
int ttv;
int tth;
} VVCAllowedSplit;
typedef struct SAOParams {
int offset_abs[3][4]; ///< sao_offset_abs
int offset_sign[3][4]; ///< sao_offset_sign
uint8_t band_position[3]; ///< sao_band_position
int eo_class[3]; ///< sao_eo_class
int16_t offset_val[3][5]; ///< SaoOffsetVal
uint8_t type_idx[3]; ///< sao_type_idx
} SAOParams;
typedef struct ALFParams {
uint8_t ctb_flag[3]; ///< alf_ctb_flag[]
uint8_t ctb_filt_set_idx_y; ///< AlfCtbFiltSetIdxY
uint8_t alf_ctb_filter_alt_idx[2]; ///< alf_ctb_filter_alt_idx[]
uint8_t ctb_cc_idc[2]; ///< alf_ctb_cc_cb_idc, alf_ctb_cc_cr_idc
uint8_t applied[3];
} ALFParams;
/**
* parse a CTU
* @param lc local context for CTU
* @param ctb_idx CTB(CTU) address in the current slice
* @param rs raster order for the CTU.
* @param rx raster order x for the CTU.
* @param ry raster order y for the CTU.
* @return AVERROR
*/
int ff_vvc_coding_tree_unit(VVCLocalContext *lc, int ctu_idx, int rs, int rx, int ry);
//utils
void ff_vvc_set_neighbour_available(VVCLocalContext *lc, int x0, int y0, int w, int h);
void ff_vvc_decode_neighbour(VVCLocalContext *lc, int x_ctb, int y_ctb, int rx, int ry, int rs);
void ff_vvc_ctu_free_cus(CTU *ctu);
int ff_vvc_get_qPy(const VVCFrameContext *fc, int xc, int yc);
void ff_vvc_ep_init_stat_coeff(EntryPoint *ep, int bit_depth, int persistent_rice_adaptation_enabled_flag);
#endif // AVCODEC_VVC_CTU_H
|