/*
 * mirror of https://github.com/FFmpeg/FFmpeg.git
 * synced 2025-01-19 05:49:09 +02:00
 * 2e936f2c11
 *
 * perf result for:
 *   "perf record -F 99 ./ffmpeg_g -i Tango2_3840x2160_60_10_420_27_LD.266 -f null -"
 *
 * before: 5.24%
 *   1.87% ffmpeg_g [.] vvc_deblock_bs_chroma
 *   1.72% ffmpeg_g [.] ff_vvc_deblock_bs
 *   1.65% ffmpeg_g [.] vvc_deblock_bs_luma
 *
 * after: 3.48%
 *   1.84% ffmpeg_g [.] vvc_deblock_bs_chroma
 *   1.64% ffmpeg_g [.] ff_vvc_deblock_bs + vvc_deblock_bs_luma(inlined)
 *
 * 494 lines, 14 KiB, C
 */
/*
 * VVC CTU(Coding Tree Unit) parser
 *
 * Copyright (C) 2022 Nuo Mi
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/* Include guard; the matching #endif is at the end of this header. */
#ifndef AVCODEC_VVC_CTU_H
#define AVCODEC_VVC_CTU_H

#include <stdbool.h>

#include "libavcodec/cabac.h"
#include "libavutil/mem_internal.h"

#include "dec.h"

/* Coding tree unit / coding unit size limits. */
#define MAX_CTU_SIZE            128

#define MAX_CU_SIZE             MAX_CTU_SIZE
#define MIN_CU_SIZE             4       /* equals 1 << MIN_CU_LOG2 */
#define MIN_CU_LOG2             2
#define MAX_CU_DEPTH            7

/* Number of MIN_CU_SIZE x MIN_CU_SIZE cells in a MAX_CTU_SIZE x MAX_CTU_SIZE area. */
#define MAX_PARTS_IN_CTU        ((MAX_CTU_SIZE >> MIN_CU_LOG2) * (MAX_CTU_SIZE >> MIN_CU_LOG2))

#define MIN_PU_SIZE             4

#define MAX_TB_SIZE             64
#define MIN_TU_SIZE             4
#define MAX_TUS_IN_CU           64

#define MAX_QP                  63

#define MAX_PB_SIZE             128
#define MAX_SCALING_RATIO       8
#define EDGE_EMU_BUFFER_STRIDE  ((MAX_PB_SIZE + 32) * MAX_SCALING_RATIO)

/*
 * Extra margins around a block (presumably for the interpolation filters);
 * each *_EXTRA equals its *_EXTRA_BEFORE + *_EXTRA_AFTER.
 */
#define CHROMA_EXTRA_BEFORE     1
#define CHROMA_EXTRA_AFTER      2
#define CHROMA_EXTRA            3
#define LUMA_EXTRA_BEFORE       3
#define LUMA_EXTRA_AFTER        4
#define LUMA_EXTRA              7
#define BILINEAR_EXTRA_BEFORE   0
#define BILINEAR_EXTRA_AFTER    1
#define BILINEAR_EXTRA          1

/* Shifts pos right by 10 bits. */
#define SCALED_INT(pos)         ((pos) >> 10)

#define MAX_CONTROL_POINTS      3

#define AFFINE_MIN_BLOCK_SIZE   4

#define MRG_MAX_NUM_CANDS       6
#define MAX_NUM_HMVP_CANDS      5

#define SAO_PADDING_SIZE        1

#define ALF_PADDING_SIZE        8
#define ALF_BLOCK_SIZE          4

#define ALF_BORDER_LUMA         3
#define ALF_BORDER_CHROMA       2

#define ALF_VB_POS_ABOVE_LUMA   4
#define ALF_VB_POS_ABOVE_CHROMA 2

#define ALF_GRADIENT_STEP       2
#define ALF_GRADIENT_BORDER     2
#define ALF_GRADIENT_SIZE       ((MAX_CU_SIZE + ALF_GRADIENT_BORDER * 2) / ALF_GRADIENT_STEP)
#define ALF_NUM_DIR             4

/**
 * Value of the luma sample at position (x, y) in the 2D array tab.
 *
 * These accessors index a row-major array and pick up the row width from
 * the caller's scope rather than from a parameter:
 *  - SAMPLE()     expects a variable `s` with `s->pps->width`;
 *  - SAMPLE_CTB() expects a variable `min_cb_width`;
 *  - CTB()        expects a variable `fc` with `fc->ps.pps->ctb_width`.
 */
#define SAMPLE(tab, x, y) ((tab)[(y) * s->pps->width + (x)])
#define SAMPLE_CTB(tab, x, y) ((tab)[(y) * min_cb_width + (x)])
#define CTB(tab, x, y) ((tab)[(y) * fc->ps.pps->ctb_width + (x)])

/** SAO type selector; enumerators count up from SAO_NOT_APPLIED = 0. */
enum SAOType {
    SAO_NOT_APPLIED = 0,
    SAO_BAND,
    SAO_EDGE,
};

/** SAO edge-offset class; enumerators count up from SAO_EO_HORIZ = 0. */
enum SAOEOClass {
    SAO_EO_HORIZ = 0,
    SAO_EO_VERT,
    SAO_EO_135D,
    SAO_EO_45D,
};

/**
 * Per-direction neighbour candidate flags.
 * NOTE(review): presumably filled in by ff_vvc_set_neighbour_available();
 * confirm against the implementation.
 */
typedef struct NeighbourAvailable {
    int cand_left;
    int cand_up;
    int cand_up_left;
    int cand_up_right;
    int cand_up_right_sap;
} NeighbourAvailable;

/** ISP split type; enumerators count up from ISP_NO_SPLIT = 0. */
enum IspType {
    ISP_NO_SPLIT,
    ISP_HOR_SPLIT,
    ISP_VER_SPLIT,
};

/** Coding tree split mode; enumerators count up from SPLIT_NONE = 0. */
typedef enum VVCSplitMode {
    SPLIT_NONE,
    SPLIT_TT_HOR,
    SPLIT_BT_HOR,
    SPLIT_TT_VER,
    SPLIT_BT_VER,
    SPLIT_QT,
} VVCSplitMode;

/** MTS index; enumerators count up from MTS_DCT2_DCT2 = 0. */
typedef enum MtsIdx {
    MTS_DCT2_DCT2,
    MTS_DST7_DST7,
    MTS_DST7_DCT8,
    MTS_DCT8_DST7,
    MTS_DCT8_DCT8,
} MtsIdx;

/**
 * State of one transform block: position, size, scan bounds, quantization
 * parameters and a pointer to its coefficients.
 */
typedef struct TransformBlock {
    uint8_t has_coeffs;
    uint8_t c_idx;          // presumably the colour component index -- TODO confirm
    uint8_t ts;             ///< transform_skip_flag
    int x0;
    int y0;

    int tb_width;
    int tb_height;
    int log2_tb_width;
    int log2_tb_height;

    int max_scan_x;
    int max_scan_y;
    int min_scan_x;
    int min_scan_y;

    int qp;
    int rect_non_ts_flag;
    int bd_shift;
    int bd_offset;

    int *coeffs;            // ownership is not visible from this header
} TransformBlock;

/** Coding tree type; enumerators count up from SINGLE_TREE = 0. */
typedef enum VVCTreeType {
    SINGLE_TREE,
    DUAL_TREE_LUMA,
    DUAL_TREE_CHROMA,
} VVCTreeType;

typedef struct TransformUnit {
|
|
int x0;
|
|
int y0;
|
|
int width;
|
|
int height;
|
|
bool avail[CHROMA + 1]; // contains luma/chroma block
|
|
|
|
uint8_t joint_cbcr_residual_flag; ///< tu_joint_cbcr_residual_flag
|
|
|
|
uint8_t coded_flag[VVC_MAX_SAMPLE_ARRAYS]; ///< tu_y_coded_flag, tu_cb_coded_flag, tu_cr_coded_flag
|
|
uint8_t nb_tbs;
|
|
TransformBlock tbs[VVC_MAX_SAMPLE_ARRAYS];
|
|
|
|
struct TransformUnit *next; ///< RefStruct reference
|
|
} TransformUnit;
|
|
|
|
/** Prediction mode of a coding unit; enumerators count up from MODE_INTER = 0. */
typedef enum PredMode {
    MODE_INTER,
    MODE_INTRA,
    MODE_SKIP,
    MODE_PLT,
    MODE_IBC,
} PredMode;

/** A motion vector. */
typedef struct Mv {
    int x;  ///< horizontal component of motion vector
    int y;  ///< vertical component of motion vector
} Mv;

typedef struct MvField {
|
|
DECLARE_ALIGNED(8, Mv, mv)[2]; ///< mvL0, vvL1
|
|
int8_t ref_idx[2]; ///< refIdxL0, refIdxL1
|
|
uint8_t hpel_if_idx; ///< hpelIfIdx
|
|
uint8_t bcw_idx; ///< bcwIdx
|
|
uint8_t pred_flag;
|
|
uint8_t ciip_flag; ///< ciip_flag
|
|
} MvField;
|
|
|
|
typedef struct DMVRInfo {
|
|
DECLARE_ALIGNED(8, Mv, mv)[2]; ///< mvL0, vvL1
|
|
uint8_t dmvr_enabled;
|
|
} DMVRInfo;
|
|
|
|
/** Motion model; enumerators count up from MOTION_TRANSLATION = 0. */
typedef enum MotionModelIdc {
    MOTION_TRANSLATION,
    MOTION_4_PARAMS_AFFINE,
    MOTION_6_PARAMS_AFFINE,
} MotionModelIdc;

/**
 * Prediction flag bit mask: PF_L0 and PF_L1 are single bits, PF_BI is both,
 * and PF_IBC is PF_L0 with bit 2 (0x4) set.
 */
typedef enum PredFlag {
    PF_INTRA = 0x0,
    PF_L0    = 0x1,
    PF_L1    = 0x2,
    PF_BI    = 0x3,
    PF_IBC   = PF_L0 | 0x4,
} PredFlag;

/**
 * Intra prediction mode numbers. INTRA_DC follows INTRA_PLANAR (1), and
 * INTRA_L_CCLM / INTRA_T_CCLM follow INTRA_LT_CCLM (82, 83).
 */
typedef enum IntraPredMode {
    INTRA_INVALID   = -1,
    INTRA_PLANAR    = 0,
    INTRA_DC,
    INTRA_HORZ      = 18,
    INTRA_DIAG      = 34,
    INTRA_VERT      = 50,
    INTRA_VDIAG     = 66,
    INTRA_LT_CCLM   = 81,
    INTRA_L_CCLM,
    INTRA_T_CCLM
} IntraPredMode;

typedef struct MotionInfo {
|
|
MotionModelIdc motion_model_idc; ///< MotionModelIdc
|
|
int8_t ref_idx[2]; ///< refIdxL0, refIdxL1
|
|
uint8_t hpel_if_idx; ///< hpelIfIdx
|
|
uint8_t bcw_idx; ///< bcwIdx
|
|
PredFlag pred_flag;
|
|
|
|
Mv mv[2][MAX_CONTROL_POINTS];
|
|
|
|
int num_sb_x, num_sb_y;
|
|
} MotionInfo;
|
|
|
|
typedef struct PredictionUnit {
|
|
uint8_t general_merge_flag;
|
|
uint8_t mmvd_merge_flag;
|
|
//InterPredIdc inter_pred_idc;
|
|
uint8_t inter_affine_flag;
|
|
|
|
//subblock predict
|
|
uint8_t merge_subblock_flag;
|
|
|
|
uint8_t merge_gpm_flag;
|
|
uint8_t gpm_partition_idx;
|
|
MvField gpm_mv[2];
|
|
|
|
int sym_mvd_flag;
|
|
|
|
MotionInfo mi;
|
|
|
|
// for regular prediction only
|
|
uint8_t dmvr_flag;
|
|
uint8_t bdof_flag;
|
|
|
|
int16_t diff_mv_x[2][AFFINE_MIN_BLOCK_SIZE * AFFINE_MIN_BLOCK_SIZE]; ///< diffMvLX
|
|
int16_t diff_mv_y[2][AFFINE_MIN_BLOCK_SIZE * AFFINE_MIN_BLOCK_SIZE]; ///< diffMvLX
|
|
int cb_prof_flag[2];
|
|
} PredictionUnit;
|
|
|
|
typedef struct CodingUnit {
|
|
VVCTreeType tree_type;
|
|
int x0;
|
|
int y0;
|
|
int cb_width;
|
|
int cb_height;
|
|
int ch_type;
|
|
int cqt_depth;
|
|
|
|
uint8_t coded_flag;
|
|
|
|
uint8_t sbt_flag;
|
|
uint8_t sbt_horizontal_flag;
|
|
uint8_t sbt_pos_flag;
|
|
|
|
int lfnst_idx;
|
|
MtsIdx mts_idx;
|
|
|
|
uint8_t act_enabled_flag;
|
|
|
|
uint8_t intra_luma_ref_idx; ///< IntraLumaRefLineIdx[][]
|
|
uint8_t intra_mip_flag; ///< intra_mip_flag
|
|
uint8_t skip_flag; ///< cu_skip_flag;
|
|
|
|
//inter
|
|
uint8_t ciip_flag;
|
|
|
|
// Inferred parameters
|
|
enum IspType isp_split_type; ///< IntraSubPartitionsSplitType
|
|
|
|
enum PredMode pred_mode; ///< PredMode
|
|
|
|
int num_intra_subpartitions;
|
|
|
|
IntraPredMode intra_pred_mode_y; ///< IntraPredModeY
|
|
IntraPredMode intra_pred_mode_c; ///< IntraPredModeC
|
|
int mip_chroma_direct_flag; ///< MipChromaDirectFlag
|
|
|
|
int bdpcm_flag[VVC_MAX_SAMPLE_ARRAYS]; ///< BdpcmFlag
|
|
|
|
int apply_lfnst_flag[VVC_MAX_SAMPLE_ARRAYS]; ///< ApplyLfnstFlag[]
|
|
|
|
struct {
|
|
TransformUnit *head; ///< RefStruct reference
|
|
TransformUnit *tail; ///< RefStruct reference
|
|
} tus;
|
|
|
|
int8_t qp[4]; ///< QpY, Qp′Cb, Qp′Cr, Qp′CbCr
|
|
|
|
PredictionUnit pu;
|
|
|
|
struct CodingUnit *next; ///< RefStruct reference
|
|
} CodingUnit;
|
|
|
|
typedef struct CTU {
|
|
int max_y[2][VVC_MAX_REF_ENTRIES];
|
|
int max_y_idx[2];
|
|
int has_dmvr;
|
|
} CTU;
|
|
|
|
/** A rectangle given by position (x, y) and size (w, h). */
typedef struct ReconstructedArea {
    int x;
    int y;
    int w;
    int h;
} ReconstructedArea;

/** State of one CABAC context: two state values and two shift values. */
typedef struct VVCCabacState {
    uint16_t state[2];
    uint8_t  shift[2];
} VVCCabacState;

// VVC_CONTEXTS matched with SYNTAX_ELEMENT_LAST, it's checked by cabac_init_state.
|
|
#define VVC_CONTEXTS 378
|
|
typedef struct EntryPoint {
|
|
int8_t qp_y; ///< QpY
|
|
|
|
int stat_coeff[VVC_MAX_SAMPLE_ARRAYS]; ///< StatCoeff
|
|
|
|
VVCCabacState cabac_state[VVC_CONTEXTS];
|
|
CABACContext cc;
|
|
|
|
int ctu_start;
|
|
int ctu_end;
|
|
|
|
uint8_t is_first_qg; // first quantization group
|
|
|
|
MvField hmvp[MAX_NUM_HMVP_CANDS]; ///< HmvpCandList
|
|
int num_hmvp; ///< NumHmvpCand
|
|
MvField hmvp_ibc[MAX_NUM_HMVP_CANDS]; ///< HmvpIbcCandList
|
|
int num_hmvp_ibc; ///< NumHmvpIbcCand
|
|
} EntryPoint;
|
|
|
|
typedef struct VVCLocalContext {
|
|
uint8_t ctb_left_flag;
|
|
uint8_t ctb_up_flag;
|
|
uint8_t ctb_up_right_flag;
|
|
uint8_t ctb_up_left_flag;
|
|
int end_of_tiles_x;
|
|
int end_of_tiles_y;
|
|
|
|
/* *2 for high bit depths */
|
|
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer)[EDGE_EMU_BUFFER_STRIDE * EDGE_EMU_BUFFER_STRIDE * 2];
|
|
DECLARE_ALIGNED(32, int16_t, tmp)[MAX_PB_SIZE * MAX_PB_SIZE];
|
|
DECLARE_ALIGNED(32, int16_t, tmp1)[MAX_PB_SIZE * MAX_PB_SIZE];
|
|
DECLARE_ALIGNED(32, int16_t, tmp2)[MAX_PB_SIZE * MAX_PB_SIZE];
|
|
DECLARE_ALIGNED(32, uint8_t, ciip_tmp)[MAX_PB_SIZE * MAX_PB_SIZE * 2];
|
|
DECLARE_ALIGNED(32, uint8_t, sao_buffer)[(MAX_CTU_SIZE + 2 * SAO_PADDING_SIZE) * EDGE_EMU_BUFFER_STRIDE * 2];
|
|
DECLARE_ALIGNED(32, uint8_t, alf_buffer_luma)[(MAX_CTU_SIZE + 2 * ALF_PADDING_SIZE) * EDGE_EMU_BUFFER_STRIDE * 2];
|
|
DECLARE_ALIGNED(32, uint8_t, alf_buffer_chroma)[(MAX_CTU_SIZE + 2 * ALF_PADDING_SIZE) * EDGE_EMU_BUFFER_STRIDE * 2];
|
|
DECLARE_ALIGNED(32, int32_t, alf_gradient_tmp)[ALF_GRADIENT_SIZE * ALF_GRADIENT_SIZE * ALF_NUM_DIR];
|
|
|
|
struct {
|
|
int sbt_num_fourths_tb0; ///< SbtNumFourthsTb0
|
|
|
|
uint8_t is_cu_qp_delta_coded; ///< IsCuQpDeltaCoded
|
|
int cu_qg_top_left_x; ///< CuQgTopLeftX
|
|
int cu_qg_top_left_y; ///< CuQgTopLeftY
|
|
int is_cu_chroma_qp_offset_coded; ///< IsCuChromaQpOffsetCoded
|
|
int chroma_qp_offset[3]; ///< CuQpOffsetCb, CuQpOffsetCr, CuQpOffsetCbCr
|
|
|
|
int infer_tu_cbf_luma; ///< InferTuCbfLuma
|
|
int prev_tu_cbf_y; ///< prevTuCbfY;
|
|
|
|
int lfnst_dc_only; ///< LfnstDcOnly
|
|
int lfnst_zero_out_sig_coeff_flag; ///< LfnstZeroOutSigCoeffFlag
|
|
|
|
int mts_dc_only; ///< MtsDcOnly
|
|
int mts_zero_out_sig_coeff_flag; ///< MtsZeroOutSigCoeffFlag;
|
|
} parse;
|
|
|
|
struct {
|
|
// lmcs cache, for recon only
|
|
int chroma_scale;
|
|
int x_vpdu;
|
|
int y_vpdu;
|
|
} lmcs;
|
|
|
|
CodingUnit *cu;
|
|
ReconstructedArea ras[2][MAX_PARTS_IN_CTU];
|
|
int num_ras[2];
|
|
|
|
NeighbourAvailable na;
|
|
|
|
#define BOUNDARY_LEFT_SLICE (1 << 0)
|
|
#define BOUNDARY_LEFT_TILE (1 << 1)
|
|
#define BOUNDARY_LEFT_SUBPIC (1 << 2)
|
|
#define BOUNDARY_UPPER_SLICE (1 << 3)
|
|
#define BOUNDARY_UPPER_TILE (1 << 4)
|
|
#define BOUNDARY_UPPER_SUBPIC (1 << 5)
|
|
/* properties of the boundary of the current CTB for the purposes
|
|
* of the deblocking filter */
|
|
int boundary_flags;
|
|
|
|
SliceContext *sc;
|
|
VVCFrameContext *fc;
|
|
EntryPoint *ep;
|
|
int *coeffs;
|
|
} VVCLocalContext;
|
|
|
|
/**
 * One flag per split kind: qt, btv, bth, ttv, tth.
 * NOTE(review): presumably these correspond to the SPLIT_* modes of
 * VVCSplitMode -- confirm against the code that fills this in.
 */
typedef struct VVCAllowedSplit {
    int qt;
    int btv;
    int bth;
    int ttv;
    int tth;
} VVCAllowedSplit;

/** SAO parameters; the first dimension of every array has three entries. */
typedef struct SAOParams {
    int offset_abs[3][4];           ///< sao_offset_abs
    int offset_sign[3][4];          ///< sao_offset_sign

    uint8_t band_position[3];       ///< sao_band_position

    int eo_class[3];                ///< sao_eo_class

    int16_t offset_val[3][5];       ///< SaoOffsetVal

    uint8_t type_idx[3];            ///< sao_type_idx
} SAOParams;

/** Per-CTB ALF parameters. */
typedef struct ALFParams {
    uint8_t ctb_flag[3];                ///< alf_ctb_flag[]
    uint8_t ctb_filt_set_idx_y;         ///< AlfCtbFiltSetIdxY
    uint8_t alf_ctb_filter_alt_idx[2];  ///< alf_ctb_filter_alt_idx[]
    uint8_t ctb_cc_idc[2];              ///< alf_ctb_cc_cb_idc, alf_ctb_cc_cr_idc
} ALFParams;

/** A rectangle given by its four edges. */
typedef struct VVCRect {
    int l;  // left
    int t;  // top
    int r;  // right
    int b;  // bottom
} VVCRect;

/**
|
|
* parse a CTU
|
|
* @param lc local context for CTU
|
|
* @param ctb_idx CTB(CTU) address in the current slice
|
|
* @param rs raster order for the CTU.
|
|
* @param rx raster order x for the CTU.
|
|
* @param ry raster order y for the CTU.
|
|
* @return AVERROR
|
|
*/
|
|
int ff_vvc_coding_tree_unit(VVCLocalContext *lc, int ctu_idx, int rs, int rx, int ry);
|
|
|
|
//utils
|
|
void ff_vvc_set_neighbour_available(VVCLocalContext *lc, int x0, int y0, int w, int h);
|
|
void ff_vvc_decode_neighbour(VVCLocalContext *lc, int x_ctb, int y_ctb, int rx, int ry, int rs);
|
|
void ff_vvc_ctu_free_cus(CodingUnit **cus);
|
|
int ff_vvc_get_qPy(const VVCFrameContext *fc, int xc, int yc);
|
|
void ff_vvc_ep_init_stat_coeff(EntryPoint *ep, int bit_depth, int persistent_rice_adaptation_enabled_flag);
|
|
|
|
#endif // AVCODEC_VVC_CTU_H
|