ffmpeg/libavcodec/vvc/ps.h
Frank Plowman 993c231de0 lavc/vvc: Increase size of ctb_size_y
sps_log2_ctu_size_minus5 is between 0 and 2, with 3 reserved for future
use.  The VVC decoder allows sps_log2_ctu_size_minus5 to be 3, and so
ctb_size_y should be at least 16 bits to prevent overflows.  An
alternative patch would leave sps_log2_ctu_size_minus5 as 8 bits and
disallow sps_log2_ctu_size_minus5 = 3.

Signed-off-by: Frank Plowman <post@frankplowman.com>
2024-04-15 21:06:13 +08:00

270 lines
11 KiB
C
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/*
* VVC parameter set parser
*
* Copyright (C) 2023 Nuo Mi
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#ifndef AVCODEC_VVC_PS_H
#define AVCODEC_VVC_PS_H
#include "libavcodec/cbs_h266.h"
#include "libavcodec/vvc.h"
#define IS_IDR(s) ((s)->vcl_unit_type == VVC_IDR_W_RADL || (s)->vcl_unit_type == VVC_IDR_N_LP)
#define IS_CRA(s) ((s)->vcl_unit_type == VVC_CRA_NUT)
#define IS_IRAP(s) (IS_IDR(s) || IS_CRA(s))
#define IS_GDR(s) ((s)->vcl_unit_type == VVC_GDR_NUT)
#define IS_CVSS(s) (IS_IRAP(s)|| IS_GDR(s))
#define IS_CLVSS(s) (IS_CVSS(s) && s->no_output_before_recovery_flag)
#define IS_RASL(s) ((s)->vcl_unit_type == VVC_RASL_NUT)
#define IS_RADL(s) ((s)->vcl_unit_type == VVC_RADL_NUT)
#define IS_I(rsh) ((rsh)->sh_slice_type == VVC_SLICE_TYPE_I)
#define IS_P(rsh) ((rsh)->sh_slice_type == VVC_SLICE_TYPE_P)
#define IS_B(rsh) ((rsh)->sh_slice_type == VVC_SLICE_TYPE_B)
#define INV_POC INT_MIN
#define GDR_IS_RECOVERED(s) (s->gdr_recovery_point_poc == INV_POC)
#define GDR_SET_RECOVERED(s) (s->gdr_recovery_point_poc = INV_POC)
#define LMCS_MAX_BIT_DEPTH 12
#define LMCS_MAX_LUT_SIZE (1 << LMCS_MAX_BIT_DEPTH)
#define LMCS_MAX_BIN_SIZE 16
#define LADF_MAX_INTERVAL 5
enum {
CHROMA_FORMAT_MONO,
CHROMA_FORMAT_420,
CHROMA_FORMAT_422,
CHROMA_FORMAT_444,
};
typedef struct VVCSPS {
const H266RawSPS *r; ///< RefStruct reference
//derived values
uint8_t hshift[VVC_MAX_SAMPLE_ARRAYS];
uint8_t vshift[VVC_MAX_SAMPLE_ARRAYS];
uint32_t max_pic_order_cnt_lsb; ///< MaxPicOrderCntLsb
uint8_t pixel_shift;
enum AVPixelFormat pix_fmt;
uint8_t bit_depth; ///< BitDepth
uint8_t qp_bd_offset; ///< QpBdOffset
uint8_t ctb_log2_size_y; ///< CtbLog2SizeY
uint16_t ctb_size_y; ///< CtbSizeY
uint8_t min_cb_log2_size_y; ///< MinCbLog2SizeY
uint8_t min_cb_size_y; ///< MinCbSizeY
uint8_t max_tb_size_y; ///< MaxTbSizeY
uint8_t max_ts_size; ///< MaxTsSize
uint8_t max_num_merge_cand; ///< MaxNumMergeCand
uint8_t max_num_ibc_merge_cand; ///< MaxNumIbcMergeCand
uint8_t max_num_gpm_merge_cand; ///< MaxNumGpmMergeCand
uint8_t num_ladf_intervals; ///< sps_num_ladf_intervals_minus2 + 2;
uint32_t ladf_interval_lower_bound[LADF_MAX_INTERVAL]; ///< SpsLadfIntervalLowerBound[]
uint8_t log2_parallel_merge_level; ///< sps_log2_parallel_merge_level_minus2 + 2;
uint8_t log2_transform_range; ///< Log2TransformRange
int8_t chroma_qp_table[3][VVC_MAX_POINTS_IN_QP_TABLE]; ///< ChromaQpTable
} VVCSPS;
typedef struct DBParams {
int8_t beta_offset[VVC_MAX_SAMPLE_ARRAYS];
int8_t tc_offset[VVC_MAX_SAMPLE_ARRAYS];
} DBParams;
typedef struct VVCPPS {
const H266RawPPS *r; ///< RefStruct reference
//derived value;
int8_t chroma_qp_offset[3]; ///< pps_cb_qp_offset, pps_cr_qp_offset, pps_joint_cbcr_qp_offset_value
int8_t chroma_qp_offset_list[6][3]; ///< pps_cb_qp_offset_list, pps_cr_qp_offset_list, pps_joint_cbcr_qp_offset_list
uint16_t width;
uint16_t height;
uint16_t slice_start_offset[VVC_MAX_SLICES];
uint16_t num_ctus_in_slice [VVC_MAX_SLICES];
uint16_t min_cb_width;
uint16_t min_cb_height;
uint16_t ctb_width;
uint16_t ctb_height;
uint32_t ctb_count;
uint16_t min_pu_width;
uint16_t min_pu_height;
uint16_t min_tu_width;
uint16_t min_tu_height;
uint32_t *ctb_addr_in_slice; ///< CtbAddrInCurrSlice for entire picture
uint16_t *col_bd; ///< TileColBdVal
uint16_t *row_bd; ///< TileRowBdVal
uint16_t *ctb_to_col_bd; ///< CtbToTileColBd
uint16_t *ctb_to_row_bd; ///< CtbToTileRowBd
uint16_t width32; ///< width in 32 pixels
uint16_t height32; ///< height in 32 pixels
uint16_t width64; ///< width in 64 pixels
uint16_t height64; ///< height in 64 pixels
uint16_t ref_wraparound_offset; ///< PpsRefWraparoundOffset
uint16_t subpic_x[VVC_MAX_SLICES]; ///< SubpicLeftBoundaryPos
uint16_t subpic_y[VVC_MAX_SLICES]; ///< SubpicTopBoundaryPos
uint16_t subpic_width[VVC_MAX_SLICES];
uint16_t subpic_height[VVC_MAX_SLICES];
} VVCPPS;
#define MAX_WEIGHTS 15
typedef struct PredWeightTable {
uint8_t log2_denom[2]; ///< luma_log2_weight_denom, ChromaLog2WeightDenom
uint8_t nb_weights[2]; ///< num_l0_weights, num_l1_weights
uint8_t weight_flag[2][2][MAX_WEIGHTS]; ///< luma_weight_l0_flag, chroma_weight_l0_flag,
///< luma_weight_l1_flag, chroma_weight_l1_flag,
int16_t weight[2][VVC_MAX_SAMPLE_ARRAYS][MAX_WEIGHTS]; ///< LumaWeightL0, LumaWeightL1, ChromaWeightL0, ChromaWeightL1
int16_t offset[2][VVC_MAX_SAMPLE_ARRAYS][MAX_WEIGHTS]; ///< luma_offset_l0, luma_offset_l1, ChromaOffsetL0, ChromaOffsetL1
} PredWeightTable;
typedef struct VVCPH {
const H266RawPictureHeader *r;
void *rref; ///< RefStruct reference, backing ph above
//derived values
uint32_t max_num_subblock_merge_cand; ///< MaxNumSubblockMergeCand
int32_t poc; ///< PicOrderCntVal
PredWeightTable pwt;
} VVCPH;
#define ALF_NUM_FILTERS_LUMA 25
#define ALF_NUM_FILTERS_CHROMA 8
#define ALF_NUM_FILTERS_CC 4
#define ALF_NUM_COEFF_LUMA 12
#define ALF_NUM_COEFF_CHROMA 6
#define ALF_NUM_COEFF_CC 7
typedef struct VVCALF {
int16_t luma_coeff [ALF_NUM_FILTERS_LUMA][ALF_NUM_COEFF_LUMA];
uint8_t luma_clip_idx [ALF_NUM_FILTERS_LUMA][ALF_NUM_COEFF_LUMA];
uint8_t num_chroma_filters;
int16_t chroma_coeff [ALF_NUM_FILTERS_CHROMA][ALF_NUM_COEFF_CHROMA];
uint8_t chroma_clip_idx[ALF_NUM_FILTERS_CHROMA][ALF_NUM_COEFF_CHROMA];
uint8_t num_cc_filters[2]; ///< alf_cc_cb_filters_signalled_minus1 + 1, alf_cc_cr_filters_signalled_minus1 + 1
int16_t cc_coeff[2][ALF_NUM_FILTERS_CC][ALF_NUM_COEFF_CC];
} VVCALF;
enum {
SL_START_2x2 = 0,
SL_START_4x4 = 2,
SL_START_8x8 = 8,
SL_START_16x16 = 14,
SL_START_32x32 = 20,
SL_START_64x64 = 26,
SL_MAX_ID = 28,
};
#define SL_MAX_MATRIX_SIZE 8
typedef struct VVCScalingList {
uint8_t scaling_matrix_rec[SL_MAX_ID][SL_MAX_MATRIX_SIZE * SL_MAX_MATRIX_SIZE]; ///< ScalingMatrixRec
uint8_t scaling_matrix_dc_rec[SL_MAX_ID - SL_START_16x16]; ///< ScalingMatrixDcRec[refId 14]
} VVCScalingList;
typedef struct VVCLMCS {
uint8_t min_bin_idx;
uint8_t max_bin_idx;
union {
uint8_t u8[LMCS_MAX_LUT_SIZE];
uint16_t u16[LMCS_MAX_LUT_SIZE]; ///< for high bit-depth
} fwd_lut, inv_lut;
uint16_t pivot[LMCS_MAX_BIN_SIZE + 1];
uint16_t chroma_scale_coeff[LMCS_MAX_BIN_SIZE];
} VVCLMCS;
#define VVC_MAX_ALF_COUNT 8
#define VVC_MAX_LMCS_COUNT 4
#define VVC_MAX_SL_COUNT 8
typedef struct VVCParamSets {
const VVCSPS *sps_list[VVC_MAX_SPS_COUNT]; ///< RefStruct reference
const VVCPPS *pps_list[VVC_MAX_PPS_COUNT]; ///< RefStruct reference
const VVCALF *alf_list[VVC_MAX_ALF_COUNT]; ///< RefStruct reference
const H266RawAPS *lmcs_list[VVC_MAX_LMCS_COUNT]; ///< RefStruct reference
const VVCScalingList *scaling_list[VVC_MAX_SL_COUNT]; ///< RefStruct reference
// Bit field of SPS IDs used in the current CVS
uint16_t sps_id_used;
} VVCParamSets;
typedef struct VVCFrameParamSets {
const VVCSPS *sps; ///< RefStruct reference
const VVCPPS *pps; ///< RefStruct reference
VVCPH ph;
const VVCALF *alf_list[VVC_MAX_ALF_COUNT]; ///< RefStruct reference
VVCLMCS lmcs;
const VVCScalingList *sl; ///< RefStruct reference
} VVCFrameParamSets;
typedef struct VVCSH {
const H266RawSliceHeader *r; ///< RefStruct reference
// derived values
// ctu address
uint32_t num_ctus_in_curr_slice; ///< NumCtusInCurrSlice
const uint32_t* ctb_addr_in_curr_slice; ///< CtbAddrInCurrSlice
// inter
PredWeightTable pwt;
int8_t ref_idx_sym[2]; ///< RefIdxSymL0, RefIdxSymL1
// qp_y
int8_t slice_qp_y; ///< SliceQpY
// deblock_offsets
DBParams deblock;
// partition constrains
uint8_t min_qt_size[2]; ///< MinQtSizeY, MinQtSizeC
uint8_t max_bt_size[2]; ///< MaxBtSizeY, MaxBtSizeC
uint8_t max_tt_size[2]; ///< MaxTtSizeY, MaxTtSizeC
uint8_t max_mtt_depth[2]; ///< MaxMttDepthY, MaxMttDepthC
uint8_t cu_qp_delta_subdiv; ///< CuQpDeltaSubdiv
uint8_t cu_chroma_qp_offset_subdiv; ///< CuChromaQpOffsetSubdiv
// entries
uint32_t entry_point_start_ctu[VVC_MAX_ENTRY_POINTS]; ///< entry point start in ctu_addr
} VVCSH;
struct VVCContext;
int ff_vvc_decode_frame_ps(VVCFrameParamSets *fps, struct VVCContext *s);
int ff_vvc_decode_aps(VVCParamSets *ps, const CodedBitstreamUnit *unit);
int ff_vvc_decode_sh(VVCSH *sh, const VVCFrameParamSets *ps, const CodedBitstreamUnit *unit);
void ff_vvc_frame_ps_free(VVCFrameParamSets *fps);
void ff_vvc_ps_uninit(VVCParamSets *ps);
#endif /* AVCODEC_VVC_PS_H */