mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
354 lines
14 KiB
354 lines
14 KiB
1 year ago
|
/*
|
||
|
* This file is part of FFmpeg.
|
||
|
*
|
||
|
* FFmpeg is free software; you can redistribute it and/or
|
||
|
* modify it under the terms of the GNU Lesser General Public
|
||
|
* License as published by the Free Software Foundation; either
|
||
|
* version 2.1 of the License, or (at your option) any later version.
|
||
|
*
|
||
|
* FFmpeg is distributed in the hope that it will be useful,
|
||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
|
* Lesser General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU Lesser General Public
|
||
|
* License along with FFmpeg; if not, write to the Free Software
|
||
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
||
|
*/
|
||
|
|
||
|
/**
|
||
|
* @file
|
||
|
* EVC decoder/parser shared code
|
||
|
*/
|
||
|
|
||
|
#ifndef AVCODEC_EVC_PARSE_H
|
||
|
#define AVCODEC_EVC_PARSE_H
|
||
|
|
||
|
#define EVC_MAX_QP_TABLE_SIZE 58
|
||
|
#define NUM_CPB 32
|
||
|
|
||
|
// rpl structure
|
||
|
typedef struct RefPicListStruct {
|
||
|
int poc;
|
||
|
int tid;
|
||
|
int ref_pic_num;
|
||
|
int ref_pic_active_num;
|
||
|
int ref_pics[EVC_MAX_NUM_REF_PICS];
|
||
|
char pic_type;
|
||
|
|
||
|
} RefPicListStruct;
|
||
|
|
||
|
// chromaQP table structure to be signalled in SPS
|
||
|
typedef struct ChromaQpTable {
|
||
|
int chroma_qp_table_present_flag; // u(1)
|
||
|
int same_qp_table_for_chroma; // u(1)
|
||
|
int global_offset_flag; // u(1)
|
||
|
int num_points_in_qp_table_minus1[2]; // ue(v)
|
||
|
int delta_qp_in_val_minus1[2][EVC_MAX_QP_TABLE_SIZE]; // u(6)
|
||
|
int delta_qp_out_val[2][EVC_MAX_QP_TABLE_SIZE]; // se(v)
|
||
|
} ChromaQpTable;
|
||
|
|
||
|
// Hypothetical Reference Decoder (HRD) parameters, part of VUI
|
||
|
typedef struct HRDParameters {
|
||
|
int cpb_cnt_minus1; // ue(v)
|
||
|
int bit_rate_scale; // u(4)
|
||
|
int cpb_size_scale; // u(4)
|
||
|
int bit_rate_value_minus1[NUM_CPB]; // ue(v)
|
||
|
int cpb_size_value_minus1[NUM_CPB]; // ue(v)
|
||
|
int cbr_flag[NUM_CPB]; // u(1)
|
||
|
int initial_cpb_removal_delay_length_minus1; // u(5)
|
||
|
int cpb_removal_delay_length_minus1; // u(5)
|
||
|
int dpb_output_delay_length_minus1; // u(5)
|
||
|
int time_offset_length; // u(5)
|
||
|
} HRDParameters;
|
||
|
|
||
|
// video usability information (VUI) part of SPS
|
||
|
typedef struct VUIParameters {
|
||
|
int aspect_ratio_info_present_flag; // u(1)
|
||
|
int aspect_ratio_idc; // u(8)
|
||
|
int sar_width; // u(16)
|
||
|
int sar_height; // u(16)
|
||
|
int overscan_info_present_flag; // u(1)
|
||
|
int overscan_appropriate_flag; // u(1)
|
||
|
int video_signal_type_present_flag; // u(1)
|
||
|
int video_format; // u(3)
|
||
|
int video_full_range_flag; // u(1)
|
||
|
int colour_description_present_flag; // u(1)
|
||
|
int colour_primaries; // u(8)
|
||
|
int transfer_characteristics; // u(8)
|
||
|
int matrix_coefficients; // u(8)
|
||
|
int chroma_loc_info_present_flag; // u(1)
|
||
|
int chroma_sample_loc_type_top_field; // ue(v)
|
||
|
int chroma_sample_loc_type_bottom_field; // ue(v)
|
||
|
int neutral_chroma_indication_flag; // u(1)
|
||
|
int field_seq_flag; // u(1)
|
||
|
int timing_info_present_flag; // u(1)
|
||
|
int num_units_in_tick; // u(32)
|
||
|
int time_scale; // u(32)
|
||
|
int fixed_pic_rate_flag; // u(1)
|
||
|
int nal_hrd_parameters_present_flag; // u(1)
|
||
|
int vcl_hrd_parameters_present_flag; // u(1)
|
||
|
int low_delay_hrd_flag; // u(1)
|
||
|
int pic_struct_present_flag; // u(1)
|
||
|
int bitstream_restriction_flag; // u(1)
|
||
|
int motion_vectors_over_pic_boundaries_flag; // u(1)
|
||
|
int max_bytes_per_pic_denom; // ue(v)
|
||
|
int max_bits_per_mb_denom; // ue(v)
|
||
|
int log2_max_mv_length_horizontal; // ue(v)
|
||
|
int log2_max_mv_length_vertical; // ue(v)
|
||
|
int num_reorder_pics; // ue(v)
|
||
|
int max_dec_pic_buffering; // ue(v)
|
||
|
|
||
|
HRDParameters hrd_parameters;
|
||
|
} VUIParameters;
|
||
|
|
||
|
// The sturcture reflects SPS RBSP(raw byte sequence payload) layout
|
||
|
// @see ISO_IEC_23094-1 section 7.3.2.1
|
||
|
//
|
||
|
// The following descriptors specify the parsing process of each element
|
||
|
// u(n) - unsigned integer using n bits
|
||
|
// ue(v) - unsigned integer 0-th order Exp_Golomb-coded syntax element with the left bit first
|
||
|
typedef struct EVCParserSPS {
|
||
|
int sps_seq_parameter_set_id; // ue(v)
|
||
|
int profile_idc; // u(8)
|
||
|
int level_idc; // u(8)
|
||
|
int toolset_idc_h; // u(32)
|
||
|
int toolset_idc_l; // u(32)
|
||
|
int chroma_format_idc; // ue(v)
|
||
|
int pic_width_in_luma_samples; // ue(v)
|
||
|
int pic_height_in_luma_samples; // ue(v)
|
||
|
int bit_depth_luma_minus8; // ue(v)
|
||
|
int bit_depth_chroma_minus8; // ue(v)
|
||
|
|
||
|
int sps_btt_flag; // u(1)
|
||
|
int log2_ctu_size_minus5; // ue(v)
|
||
|
int log2_min_cb_size_minus2; // ue(v)
|
||
|
int log2_diff_ctu_max_14_cb_size; // ue(v)
|
||
|
int log2_diff_ctu_max_tt_cb_size; // ue(v)
|
||
|
int log2_diff_min_cb_min_tt_cb_size_minus2; // ue(v)
|
||
|
|
||
|
int sps_suco_flag; // u(1)
|
||
|
int log2_diff_ctu_size_max_suco_cb_size; // ue(v)
|
||
|
int log2_diff_max_suco_min_suco_cb_size; // ue(v)
|
||
|
|
||
|
int sps_admvp_flag; // u(1)
|
||
|
int sps_affine_flag; // u(1)
|
||
|
int sps_amvr_flag; // u(1)
|
||
|
int sps_dmvr_flag; // u(1)
|
||
|
int sps_mmvd_flag; // u(1)
|
||
|
int sps_hmvp_flag; // u(1)
|
||
|
|
||
|
int sps_eipd_flag; // u(1)
|
||
|
int sps_ibc_flag; // u(1)
|
||
|
int log2_max_ibc_cand_size_minus2; // ue(v)
|
||
|
|
||
|
int sps_cm_init_flag; // u(1)
|
||
|
int sps_adcc_flag; // u(1)
|
||
|
|
||
|
int sps_iqt_flag; // u(1)
|
||
|
int sps_ats_flag; // u(1)
|
||
|
|
||
|
int sps_addb_flag; // u(1)
|
||
|
int sps_alf_flag; // u(1)
|
||
|
int sps_htdf_flag; // u(1)
|
||
|
int sps_rpl_flag; // u(1)
|
||
|
int sps_pocs_flag; // u(1)
|
||
|
int sps_dquant_flag; // u(1)
|
||
|
int sps_dra_flag; // u(1)
|
||
|
|
||
|
int log2_max_pic_order_cnt_lsb_minus4; // ue(v)
|
||
|
int log2_sub_gop_length; // ue(v)
|
||
|
int log2_ref_pic_gap_length; // ue(v)
|
||
|
|
||
|
int max_num_tid0_ref_pics; // ue(v)
|
||
|
|
||
|
int sps_max_dec_pic_buffering_minus1; // ue(v)
|
||
|
int long_term_ref_pic_flag; // u(1)
|
||
|
int rpl1_same_as_rpl0_flag; // u(1)
|
||
|
int num_ref_pic_list_in_sps[2]; // ue(v)
|
||
|
struct RefPicListStruct rpls[2][EVC_MAX_NUM_RPLS];
|
||
|
|
||
|
int picture_cropping_flag; // u(1)
|
||
|
int picture_crop_left_offset; // ue(v)
|
||
|
int picture_crop_right_offset; // ue(v)
|
||
|
int picture_crop_top_offset; // ue(v)
|
||
|
int picture_crop_bottom_offset; // ue(v)
|
||
|
|
||
|
struct ChromaQpTable chroma_qp_table_struct;
|
||
|
|
||
|
int vui_parameters_present_flag; // u(1)
|
||
|
|
||
|
struct VUIParameters vui_parameters;
|
||
|
|
||
|
} EVCParserSPS;
|
||
|
|
||
|
typedef struct EVCParserPPS {
|
||
|
int pps_pic_parameter_set_id; // ue(v)
|
||
|
int pps_seq_parameter_set_id; // ue(v)
|
||
|
int num_ref_idx_default_active_minus1[2]; // ue(v)
|
||
|
int additional_lt_poc_lsb_len; // ue(v)
|
||
|
int rpl1_idx_present_flag; // u(1)
|
||
|
int single_tile_in_pic_flag; // u(1)
|
||
|
int num_tile_columns_minus1; // ue(v)
|
||
|
int num_tile_rows_minus1; // ue(v)
|
||
|
int uniform_tile_spacing_flag; // u(1)
|
||
|
int tile_column_width_minus1[EVC_MAX_TILE_ROWS]; // ue(v)
|
||
|
int tile_row_height_minus1[EVC_MAX_TILE_COLUMNS]; // ue(v)
|
||
|
int loop_filter_across_tiles_enabled_flag; // u(1)
|
||
|
int tile_offset_len_minus1; // ue(v)
|
||
|
int tile_id_len_minus1; // ue(v)
|
||
|
int explicit_tile_id_flag; // u(1)
|
||
|
int tile_id_val[EVC_MAX_TILE_ROWS][EVC_MAX_TILE_COLUMNS]; // u(v)
|
||
|
int pic_dra_enabled_flag; // u(1)
|
||
|
int pic_dra_aps_id; // u(5)
|
||
|
int arbitrary_slice_present_flag; // u(1)
|
||
|
int constrained_intra_pred_flag; // u(1)
|
||
|
int cu_qp_delta_enabled_flag; // u(1)
|
||
|
int log2_cu_qp_delta_area_minus6; // ue(v)
|
||
|
|
||
|
} EVCParserPPS;
|
||
|
|
||
|
// The sturcture reflects Slice Header RBSP(raw byte sequence payload) layout
|
||
|
// @see ISO_IEC_23094-1 section 7.3.2.6
|
||
|
//
|
||
|
// The following descriptors specify the parsing process of each element
|
||
|
// u(n) - unsigned integer using n bits
|
||
|
// ue(v) - unsigned integer 0-th order Exp_Golomb-coded syntax element with the left bit first
|
||
|
// u(n) - unsigned integer using n bits.
|
||
|
// When n is "v" in the syntax table, the number of bits varies in a manner dependent on the value of other syntax elements.
|
||
|
typedef struct EVCParserSliceHeader {
|
||
|
int slice_pic_parameter_set_id; // ue(v)
|
||
|
int single_tile_in_slice_flag; // u(1)
|
||
|
int first_tile_id; // u(v)
|
||
|
int arbitrary_slice_flag; // u(1)
|
||
|
int last_tile_id; // u(v)
|
||
|
int num_remaining_tiles_in_slice_minus1; // ue(v)
|
||
|
int delta_tile_id_minus1[EVC_MAX_TILE_ROWS * EVC_MAX_TILE_COLUMNS]; // ue(v)
|
||
|
|
||
|
int slice_type; // ue(v)
|
||
|
int no_output_of_prior_pics_flag; // u(1)
|
||
|
int mmvd_group_enable_flag; // u(1)
|
||
|
int slice_alf_enabled_flag; // u(1)
|
||
|
|
||
|
int slice_alf_luma_aps_id; // u(5)
|
||
|
int slice_alf_map_flag; // u(1)
|
||
|
int slice_alf_chroma_idc; // u(2)
|
||
|
int slice_alf_chroma_aps_id; // u(5)
|
||
|
int slice_alf_chroma_map_flag; // u(1)
|
||
|
int slice_alf_chroma2_aps_id; // u(5)
|
||
|
int slice_alf_chroma2_map_flag; // u(1)
|
||
|
int slice_pic_order_cnt_lsb; // u(v)
|
||
|
|
||
|
// @note
|
||
|
// Currently the structure does not reflect the entire Slice Header RBSP layout.
|
||
|
// It contains only the fields that are necessary to read from the NAL unit all the values
|
||
|
// necessary for the correct initialization of the AVCodecContext structure.
|
||
|
|
||
|
// @note
|
||
|
// If necessary, add the missing fields to the structure to reflect
|
||
|
// the contents of the entire NAL unit of the SPS type
|
||
|
|
||
|
} EVCParserSliceHeader;
|
||
|
|
||
|
// picture order count of the current picture
|
||
|
typedef struct EVCParserPoc {
|
||
|
int PicOrderCntVal; // current picture order count value
|
||
|
int prevPicOrderCntVal; // the picture order count of the previous Tid0 picture
|
||
|
int DocOffset; // the decoding order count of the previous picture
|
||
|
} EVCParserPoc;
|
||
|
|
||
|
typedef struct EVCParserContext {
|
||
|
//ParseContext pc;
|
||
|
EVCParserSPS *sps[EVC_MAX_SPS_COUNT];
|
||
|
EVCParserPPS *pps[EVC_MAX_PPS_COUNT];
|
||
|
|
||
|
EVCParserPoc poc;
|
||
|
|
||
|
int nuh_temporal_id; // the value of TemporalId (shall be the same for all VCL NAL units of an Access Unit)
|
||
|
int nalu_type; // the current NALU type
|
||
|
|
||
|
// Dimensions of the decoded video intended for presentation.
|
||
|
int width;
|
||
|
int height;
|
||
|
|
||
|
// Dimensions of the coded video.
|
||
|
int coded_width;
|
||
|
int coded_height;
|
||
|
|
||
|
// The format of the coded data, corresponds to enum AVPixelFormat
|
||
|
int format;
|
||
|
|
||
|
// AV_PICTURE_TYPE_I, EVC_SLICE_TYPE_P, AV_PICTURE_TYPE_B
|
||
|
int pict_type;
|
||
|
|
||
|
// Set by parser to 1 for key frames and 0 for non-key frames
|
||
|
int key_frame;
|
||
|
|
||
|
// Picture number incremented in presentation or output order.
|
||
|
// This corresponds to EVCEVCParserPoc::PicOrderCntVal
|
||
|
int output_picture_number;
|
||
|
|
||
|
// profile
|
||
|
// 0: FF_PROFILE_EVC_BASELINE
|
||
|
// 1: FF_PROFILE_EVC_MAIN
|
||
|
int profile;
|
||
|
|
||
|
// Framerate value in the compressed bitstream
|
||
|
AVRational framerate;
|
||
|
|
||
|
// Number of pictures in a group of pictures
|
||
|
int gop_size;
|
||
|
|
||
|
// Number of frames the decoded output will be delayed relative to the encoded input
|
||
|
int delay;
|
||
|
|
||
|
int parsed_extradata;
|
||
|
|
||
|
} EVCParserContext;
|
||
|
|
||
|
static inline int evc_get_nalu_type(const uint8_t *bits, int bits_size, void *logctx)
|
||
|
{
|
||
|
int unit_type_plus1 = 0;
|
||
|
|
||
|
if (bits_size >= EVC_NALU_HEADER_SIZE) {
|
||
|
unsigned char *p = (unsigned char *)bits;
|
||
|
// forbidden_zero_bit
|
||
|
if ((p[0] & 0x80) != 0) {
|
||
|
av_log(logctx, AV_LOG_ERROR, "Invalid NAL unit header\n");
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
// nal_unit_type
|
||
|
unit_type_plus1 = (p[0] >> 1) & 0x3F;
|
||
|
}
|
||
|
|
||
|
return unit_type_plus1 - 1;
|
||
|
}
|
||
|
|
||
|
static inline uint32_t evc_read_nal_unit_length(const uint8_t *bits, int bits_size, void *logctx)
|
||
|
{
|
||
|
uint32_t nalu_len = 0;
|
||
|
|
||
|
if (bits_size < EVC_NALU_LENGTH_PREFIX_SIZE) {
|
||
|
av_log(logctx, AV_LOG_ERROR, "Can't read NAL unit length\n");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
nalu_len = AV_RB32(bits);
|
||
|
|
||
|
return nalu_len;
|
||
|
}
|
||
|
|
||
|
// nuh_temporal_id specifies a temporal identifier for the NAL unit
|
||
|
int ff_evc_get_temporal_id(const uint8_t *bits, int bits_size, void *logctx);
|
||
|
|
||
|
// @see ISO_IEC_23094-1 (7.3.2.1 SPS RBSP syntax)
|
||
|
EVCParserSPS *ff_evc_parse_sps(EVCParserContext *ctx, const uint8_t *bs, int bs_size);
|
||
|
|
||
|
// @see ISO_IEC_23094-1 (7.3.2.2 SPS RBSP syntax)
|
||
|
EVCParserPPS *ff_evc_parse_pps(EVCParserContext *ctx, const uint8_t *bs, int bs_size);
|
||
|
|
||
|
int ff_evc_parse_nal_unit(EVCParserContext *ctx, const uint8_t *buf, int buf_size, void *logctx);
|
||
|
|
||
|
#endif /* AVCODEC_EVC_PARSE_H */
|