You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

354 lines
14 KiB

/*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
/**
* @file
* EVC decoder/parser shared code
*/
#ifndef AVCODEC_EVC_PARSE_H
#define AVCODEC_EVC_PARSE_H
// Capacity of each delta_qp_* row in ChromaQpTable
#define EVC_MAX_QP_TABLE_SIZE 58
// Capacity of the per-CPB arrays in HRDParameters
#define NUM_CPB 32
// Reference picture list (RPL) structure.
// EVCParserSPS keeps a table of these in its rpls[2][EVC_MAX_NUM_RPLS] member.
typedef struct RefPicListStruct {
int poc; // presumably the picture order count this list applies to — TODO confirm
int tid; // presumably a temporal id — TODO confirm
int ref_pic_num;
int ref_pic_active_num;
int ref_pics[EVC_MAX_NUM_REF_PICS]; // holds at most EVC_MAX_NUM_REF_PICS entries
char pic_type;
} RefPicListStruct;
// Chroma QP table structure to be signalled in the SPS
// (embedded in EVCParserSPS as chroma_qp_table_struct).
// The trailing comment on each field gives its bitstream descriptor.
typedef struct ChromaQpTable {
int chroma_qp_table_present_flag; // u(1)
int same_qp_table_for_chroma; // u(1)
int global_offset_flag; // u(1)
// The arrays below have a leading dimension of 2
// (presumably one slot per chroma component — TODO confirm).
int num_points_in_qp_table_minus1[2]; // ue(v)
int delta_qp_in_val_minus1[2][EVC_MAX_QP_TABLE_SIZE]; // u(6)
int delta_qp_out_val[2][EVC_MAX_QP_TABLE_SIZE]; // se(v)
} ChromaQpTable;
// Hypothetical Reference Decoder (HRD) parameters, part of VUI
// (embedded in VUIParameters as hrd_parameters).
// The trailing comment on each field gives its bitstream descriptor.
typedef struct HRDParameters {
int cpb_cnt_minus1; // ue(v)
int bit_rate_scale; // u(4)
int cpb_size_scale; // u(4)
// Per-CPB arrays; each holds at most NUM_CPB entries.
int bit_rate_value_minus1[NUM_CPB]; // ue(v)
int cpb_size_value_minus1[NUM_CPB]; // ue(v)
int cbr_flag[NUM_CPB]; // u(1)
int initial_cpb_removal_delay_length_minus1; // u(5)
int cpb_removal_delay_length_minus1; // u(5)
int dpb_output_delay_length_minus1; // u(5)
int time_offset_length; // u(5)
} HRDParameters;
// Video usability information (VUI), part of the SPS
// (embedded in EVCParserSPS as vui_parameters).
// The trailing comment on each field gives its bitstream descriptor.
typedef struct VUIParameters {
int aspect_ratio_info_present_flag; // u(1)
int aspect_ratio_idc; // u(8)
int sar_width; // u(16)
int sar_height; // u(16)
int overscan_info_present_flag; // u(1)
int overscan_appropriate_flag; // u(1)
int video_signal_type_present_flag; // u(1)
int video_format; // u(3)
int video_full_range_flag; // u(1)
int colour_description_present_flag; // u(1)
int colour_primaries; // u(8)
int transfer_characteristics; // u(8)
int matrix_coefficients; // u(8)
int chroma_loc_info_present_flag; // u(1)
int chroma_sample_loc_type_top_field; // ue(v)
int chroma_sample_loc_type_bottom_field; // ue(v)
int neutral_chroma_indication_flag; // u(1)
int field_seq_flag; // u(1)
int timing_info_present_flag; // u(1)
// NOTE(review): the next two fields are u(32) in the bitstream but are held
// in int; values with the top bit set would not fit a 32-bit int — confirm
// how the parser stores them.
int num_units_in_tick; // u(32)
int time_scale; // u(32)
int fixed_pic_rate_flag; // u(1)
int nal_hrd_parameters_present_flag; // u(1)
int vcl_hrd_parameters_present_flag; // u(1)
int low_delay_hrd_flag; // u(1)
int pic_struct_present_flag; // u(1)
int bitstream_restriction_flag; // u(1)
int motion_vectors_over_pic_boundaries_flag; // u(1)
int max_bytes_per_pic_denom; // ue(v)
int max_bits_per_mb_denom; // ue(v)
int log2_max_mv_length_horizontal; // ue(v)
int log2_max_mv_length_vertical; // ue(v)
int num_reorder_pics; // ue(v)
int max_dec_pic_buffering; // ue(v)
// HRD parameter block stored inline
HRDParameters hrd_parameters;
} VUIParameters;
// The structure reflects the SPS RBSP (raw byte sequence payload) layout
// @see ISO_IEC_23094-1 section 7.3.2.1
//
// The following descriptors specify the parsing process of each element
// u(n) - unsigned integer using n bits
// ue(v) - unsigned integer 0-th order Exp_Golomb-coded syntax element with the left bit first
// se(v) - used by the embedded ChromaQpTable; presumably the signed Exp-Golomb counterpart of ue(v)
typedef struct EVCParserSPS {
int sps_seq_parameter_set_id; // ue(v)
int profile_idc; // u(8)
int level_idc; // u(8)
// NOTE(review): the next two fields are u(32) in the bitstream but are held
// in int; values with the top bit set would not fit a 32-bit int — confirm
// how the parser stores them.
int toolset_idc_h; // u(32)
int toolset_idc_l; // u(32)
int chroma_format_idc; // ue(v)
int pic_width_in_luma_samples; // ue(v)
int pic_height_in_luma_samples; // ue(v)
int bit_depth_luma_minus8; // ue(v)
int bit_depth_chroma_minus8; // ue(v)
int sps_btt_flag; // u(1)
int log2_ctu_size_minus5; // ue(v)
int log2_min_cb_size_minus2; // ue(v)
int log2_diff_ctu_max_14_cb_size; // ue(v)
int log2_diff_ctu_max_tt_cb_size; // ue(v)
int log2_diff_min_cb_min_tt_cb_size_minus2; // ue(v)
int sps_suco_flag; // u(1)
int log2_diff_ctu_size_max_suco_cb_size; // ue(v)
int log2_diff_max_suco_min_suco_cb_size; // ue(v)
int sps_admvp_flag; // u(1)
int sps_affine_flag; // u(1)
int sps_amvr_flag; // u(1)
int sps_dmvr_flag; // u(1)
int sps_mmvd_flag; // u(1)
int sps_hmvp_flag; // u(1)
int sps_eipd_flag; // u(1)
int sps_ibc_flag; // u(1)
int log2_max_ibc_cand_size_minus2; // ue(v)
int sps_cm_init_flag; // u(1)
int sps_adcc_flag; // u(1)
int sps_iqt_flag; // u(1)
int sps_ats_flag; // u(1)
int sps_addb_flag; // u(1)
int sps_alf_flag; // u(1)
int sps_htdf_flag; // u(1)
int sps_rpl_flag; // u(1)
int sps_pocs_flag; // u(1)
int sps_dquant_flag; // u(1)
int sps_dra_flag; // u(1)
int log2_max_pic_order_cnt_lsb_minus4; // ue(v)
int log2_sub_gop_length; // ue(v)
int log2_ref_pic_gap_length; // ue(v)
int max_num_tid0_ref_pics; // ue(v)
int sps_max_dec_pic_buffering_minus1; // ue(v)
int long_term_ref_pic_flag; // u(1)
int rpl1_same_as_rpl0_flag; // u(1)
int num_ref_pic_list_in_sps[2]; // ue(v)
// Reference picture list table: first index has 2 slots (matching
// num_ref_pic_list_in_sps[2]), second holds up to EVC_MAX_NUM_RPLS lists.
struct RefPicListStruct rpls[2][EVC_MAX_NUM_RPLS];
int picture_cropping_flag; // u(1)
int picture_crop_left_offset; // ue(v)
int picture_crop_right_offset; // ue(v)
int picture_crop_top_offset; // ue(v)
int picture_crop_bottom_offset; // ue(v)
// Chroma QP table stored inline
struct ChromaQpTable chroma_qp_table_struct;
int vui_parameters_present_flag; // u(1)
// VUI block stored inline
struct VUIParameters vui_parameters;
} EVCParserSPS;
// The structure holds the fields read from a PPS (picture parameter set) RBSP,
// as returned by ff_evc_parse_pps().
//
// The trailing comment on each field gives its bitstream descriptor:
// u(n)  - unsigned integer using n bits ("v": the bit count depends on other syntax elements)
// ue(v) - unsigned integer 0-th order Exp_Golomb-coded syntax element with the left bit first
typedef struct EVCParserPPS {
    int pps_pic_parameter_set_id;                               // ue(v)
    int pps_seq_parameter_set_id;                               // ue(v)
    int num_ref_idx_default_active_minus1[2];                   // ue(v)
    int additional_lt_poc_lsb_len;                              // ue(v)
    int rpl1_idx_present_flag;                                  // u(1)
    int single_tile_in_pic_flag;                                // u(1)
    int num_tile_columns_minus1;                                // ue(v)
    int num_tile_rows_minus1;                                   // ue(v)
    int uniform_tile_spacing_flag;                              // u(1)
    // One width per tile column and one height per tile row, so each array is
    // bounded by the limit of its own dimension.
    int tile_column_width_minus1[EVC_MAX_TILE_COLUMNS];         // ue(v)
    int tile_row_height_minus1[EVC_MAX_TILE_ROWS];              // ue(v)
    int loop_filter_across_tiles_enabled_flag;                  // u(1)
    int tile_offset_len_minus1;                                 // ue(v)
    int tile_id_len_minus1;                                     // ue(v)
    int explicit_tile_id_flag;                                  // u(1)
    // Indexed [row][column]
    int tile_id_val[EVC_MAX_TILE_ROWS][EVC_MAX_TILE_COLUMNS];   // u(v)
    int pic_dra_enabled_flag;                                   // u(1)
    int pic_dra_aps_id;                                         // u(5)
    int arbitrary_slice_present_flag;                           // u(1)
    int constrained_intra_pred_flag;                            // u(1)
    int cu_qp_delta_enabled_flag;                               // u(1)
    int log2_cu_qp_delta_area_minus6;                           // ue(v)
} EVCParserPPS;
// The structure reflects the Slice Header RBSP (raw byte sequence payload) layout
// @see ISO_IEC_23094-1 section 7.3.2.6
//
// The following descriptors specify the parsing process of each element
// u(n) - unsigned integer using n bits.
// When n is "v" in the syntax table, the number of bits varies in a manner dependent on the value of other syntax elements.
// ue(v) - unsigned integer 0-th order Exp_Golomb-coded syntax element with the left bit first
typedef struct EVCParserSliceHeader {
int slice_pic_parameter_set_id; // ue(v)
int single_tile_in_slice_flag; // u(1)
int first_tile_id; // u(v)
int arbitrary_slice_flag; // u(1)
int last_tile_id; // u(v)
int num_remaining_tiles_in_slice_minus1; // ue(v)
// Capacity is EVC_MAX_TILE_ROWS * EVC_MAX_TILE_COLUMNS entries
int delta_tile_id_minus1[EVC_MAX_TILE_ROWS * EVC_MAX_TILE_COLUMNS]; // ue(v)
int slice_type; // ue(v)
int no_output_of_prior_pics_flag; // u(1)
int mmvd_group_enable_flag; // u(1)
int slice_alf_enabled_flag; // u(1)
int slice_alf_luma_aps_id; // u(5)
int slice_alf_map_flag; // u(1)
int slice_alf_chroma_idc; // u(2)
int slice_alf_chroma_aps_id; // u(5)
int slice_alf_chroma_map_flag; // u(1)
int slice_alf_chroma2_aps_id; // u(5)
int slice_alf_chroma2_map_flag; // u(1)
int slice_pic_order_cnt_lsb; // u(v)
// @note
// Currently the structure does not reflect the entire Slice Header RBSP layout.
// It contains only the fields that are necessary to read from the NAL unit all the values
// necessary for the correct initialization of the AVCodecContext structure.
// @note
// If necessary, add the missing fields to the structure to reflect
// the contents of the entire slice header
} EVCParserSliceHeader;
// Picture order count state of the current picture
// (stored in EVCParserContext as the poc member).
typedef struct EVCParserPoc {
int PicOrderCntVal; // current picture order count value
int prevPicOrderCntVal; // the picture order count of the previous Tid0 picture
int DocOffset; // the decoding order count of the previous picture
} EVCParserPoc;
// Parser state passed to ff_evc_parse_sps(), ff_evc_parse_pps() and
// ff_evc_parse_nal_unit(): parameter set tables plus the stream properties
// described by the per-field comments below.
typedef struct EVCParserContext {
//ParseContext pc;
// Parameter set tables with EVC_MAX_SPS_COUNT / EVC_MAX_PPS_COUNT pointer slots
// (presumably indexed by parameter set id — TODO confirm)
EVCParserSPS *sps[EVC_MAX_SPS_COUNT];
EVCParserPPS *pps[EVC_MAX_PPS_COUNT];
EVCParserPoc poc;
int nuh_temporal_id; // the value of TemporalId (shall be the same for all VCL NAL units of an Access Unit)
int nalu_type; // the current NALU type
// Dimensions of the decoded video intended for presentation.
int width;
int height;
// Dimensions of the coded video.
int coded_width;
int coded_height;
// The format of the coded data, corresponds to enum AVPixelFormat
int format;
// AV_PICTURE_TYPE_I, EVC_SLICE_TYPE_P, AV_PICTURE_TYPE_B
// NOTE(review): EVC_SLICE_TYPE_P looks out of place next to the two
// AV_PICTURE_TYPE_* names; presumably AV_PICTURE_TYPE_P is meant — confirm.
int pict_type;
// Set by parser to 1 for key frames and 0 for non-key frames
int key_frame;
// Picture number incremented in presentation or output order.
// This corresponds to EVCParserPoc::PicOrderCntVal
int output_picture_number;
// profile
// 0: FF_PROFILE_EVC_BASELINE
// 1: FF_PROFILE_EVC_MAIN
int profile;
// Framerate value in the compressed bitstream
AVRational framerate;
// Number of pictures in a group of pictures
int gop_size;
// Number of frames the decoded output will be delayed relative to the encoded input
int delay;
int parsed_extradata;
} EVCParserContext;
/**
 * Extract the NAL unit type from the first byte of a NAL unit header.
 *
 * @param bits      buffer positioned at the NAL unit header
 * @param bits_size number of bytes available in bits
 * @param logctx    logging context handed to av_log()
 * @return the six-bit header field (bits 6..1 of the first byte) minus one;
 *         -1 when fewer than EVC_NALU_HEADER_SIZE bytes are available
 *         (nothing is logged) or when the top bit of the first byte is set
 *         (an error is logged)
 */
static inline int evc_get_nalu_type(const uint8_t *bits, int bits_size, void *logctx)
{
    uint8_t first_byte;

    // Too short to carry a header: the type-plus-one field counts as 0,
    // which yields -1 after the final subtraction.
    if (bits_size < EVC_NALU_HEADER_SIZE)
        return -1;

    first_byte = bits[0];

    // forbidden_zero_bit (most significant bit) must be clear
    if (first_byte & 0x80) {
        av_log(logctx, AV_LOG_ERROR, "Invalid NAL unit header\n");
        return -1;
    }

    // nal_unit_type_plus1 sits in the six bits right below the forbidden bit
    return ((first_byte >> 1) & 0x3F) - 1;
}
/**
 * Read the NAL unit length prefix found at the start of a buffer.
 *
 * @param bits      buffer positioned at the length prefix
 * @param bits_size number of bytes available in bits
 * @param logctx    logging context handed to av_log()
 * @return the value obtained with AV_RB32() from bits, or 0 (after logging
 *         an error) when fewer than EVC_NALU_LENGTH_PREFIX_SIZE bytes are
 *         available
 */
static inline uint32_t evc_read_nal_unit_length(const uint8_t *bits, int bits_size, void *logctx)
{
    if (bits_size >= EVC_NALU_LENGTH_PREFIX_SIZE)
        return AV_RB32(bits);

    av_log(logctx, AV_LOG_ERROR, "Can't read NAL unit length\n");
    return 0;
}
// nuh_temporal_id specifies a temporal identifier for the NAL unit
int ff_evc_get_temporal_id(const uint8_t *bits, int bits_size, void *logctx);
// @see ISO_IEC_23094-1 (7.3.2.1 SPS RBSP syntax)
EVCParserSPS *ff_evc_parse_sps(EVCParserContext *ctx, const uint8_t *bs, int bs_size);
// @see ISO_IEC_23094-1 (7.3.2.2 PPS RBSP syntax)
EVCParserPPS *ff_evc_parse_pps(EVCParserContext *ctx, const uint8_t *bs, int bs_size);
// Parses one NAL unit from buf (buf_size bytes) using the state in ctx;
// logctx is presumably the av_log() context used for diagnostics — TODO confirm.
int ff_evc_parse_nal_unit(EVCParserContext *ctx, const uint8_t *buf, int buf_size, void *logctx);
#endif /* AVCODEC_EVC_PARSE_H */