mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
501 lines
15 KiB
501 lines
15 KiB
/* |
|
* AV1 helper functions for muxers |
|
* Copyright (c) 2018 James Almer <jamrial@gmail.com> |
|
* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or |
|
* modify it under the terms of the GNU Lesser General Public |
|
* License as published by the Free Software Foundation; either |
|
* version 2.1 of the License, or (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
* Lesser General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU Lesser General Public |
|
* License along with FFmpeg; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
*/ |
|
|
|
#include "libavutil/avassert.h" |
|
#include "libavutil/mem.h" |
|
#include "libavcodec/av1.h" |
|
#include "libavcodec/av1_parse.h" |
|
#include "libavcodec/defs.h" |
|
#include "libavcodec/put_bits.h" |
|
#include "av1.h" |
|
#include "avio.h" |
|
#include "avio_internal.h" |
|
|
|
/**
 * Walk a buffer of OBUs and keep only the ones that are not temporal
 * delimiter, redundant frame header, tile list or padding OBUs.
 *
 * @param pb     if non-NULL, every kept OBU is written to it; if NULL the
 *               buffer is only measured
 * @param buf    start of the OBU data
 * @param size   number of bytes available at buf
 * @param offset if non-NULL, receives the offset from buf of the first kept
 *               OBU when all kept OBUs are adjacent to each other (0 when
 *               nothing was kept), or -1 when a dropped OBU lies between
 *               two kept ones
 * @return the summed length of all kept OBUs, or the negative value
 *         reported by parse_obu_header()
 */
static int av1_filter_obus(AVIOContext *pb, const uint8_t *buf,
                           int size, int *offset)
{
    /* Tracks whether the kept OBUs still form one contiguous run. */
    enum {
        RUN_PENDING,   /* no kept OBU seen yet                       */
        RUN_OPEN,      /* inside the first run of kept OBUs          */
        RUN_CLOSED,    /* a dropped OBU followed the first run       */
        RUN_BROKEN,    /* a kept OBU appeared after the run was closed */
    } run = RUN_PENDING;
    const uint8_t *const base  = buf;
    const uint8_t *const limit = buf + size;
    int first_kept = 0;
    int kept_bytes = 0;

    while (buf < limit) {
        int64_t obu_size;
        int start_pos, type, temporal_id, spatial_id;
        int dropped;
        int len = parse_obu_header(buf, limit - buf, &obu_size, &start_pos,
                                   &type, &temporal_id, &spatial_id);
        if (len < 0)
            return len;

        dropped = type == AV1_OBU_TEMPORAL_DELIMITER     ||
                  type == AV1_OBU_REDUNDANT_FRAME_HEADER ||
                  type == AV1_OBU_TILE_LIST              ||
                  type == AV1_OBU_PADDING;

        if (dropped) {
            if (run == RUN_OPEN)
                run = RUN_CLOSED;
        } else {
            if (run == RUN_PENDING) {
                first_kept = buf - base;
                run        = RUN_OPEN;
            } else if (run == RUN_CLOSED) {
                run = RUN_BROKEN;
            }

            if (pb)
                avio_write(pb, buf, len);
            kept_bytes += len;
        }

        buf += len;
    }

    if (offset)
        *offset = run == RUN_BROKEN ? -1 : first_kept;

    return kept_bytes;
}
|
|
|
/**
 * Filter the OBUs found in buf through av1_filter_obus() without asking
 * for the offset of the first kept OBU.
 *
 * @param pb   forwarded to av1_filter_obus() as the write destination
 * @param buf  start of the OBU data
 * @param size number of bytes available at buf
 * @return whatever av1_filter_obus() returns
 */
int ff_av1_filter_obus(AVIOContext *pb, const uint8_t *buf, int size)
{
    int *const no_offset = NULL;

    return av1_filter_obus(pb, buf, size, no_offset);
}
|
|
|
int ff_av1_filter_obus_buf(const uint8_t *in, uint8_t **out, |
|
int *size, int *offset) |
|
{ |
|
FFIOContext pb; |
|
uint8_t *buf; |
|
int len, off, ret; |
|
|
|
len = ret = av1_filter_obus(NULL, in, *size, &off); |
|
if (ret < 0) { |
|
return ret; |
|
} |
|
if (off >= 0) { |
|
*out = (uint8_t *)in; |
|
*size = len; |
|
*offset = off; |
|
|
|
return 0; |
|
} |
|
|
|
buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE); |
|
if (!buf) |
|
return AVERROR(ENOMEM); |
|
|
|
ffio_init_context(&pb, buf, len, 1, NULL, NULL, NULL, NULL); |
|
|
|
ret = av1_filter_obus(&pb.pub, in, *size, NULL); |
|
av_assert1(ret == len); |
|
|
|
memset(buf + len, 0, AV_INPUT_BUFFER_PADDING_SIZE); |
|
|
|
*out = buf; |
|
*size = len; |
|
*offset = 0; |
|
|
|
return 0; |
|
} |
|
|
|
/**
 * Skip over one uvlc-coded value in the bit reader.
 *
 * Bits are consumed until a set bit has been read or no bits are left,
 * counting the zero bits seen. Unless 32 or more zeros were counted, that
 * many further bits are then skipped.
 */
static inline void uvlc(GetBitContext *gb)
{
    int zero_run = 0;

    /* The terminating set bit, if any, is consumed by get_bits1(). */
    while (get_bits_left(gb) && !get_bits1(gb))
        zero_run++;

    if (zero_run < 32)
        skip_bits_long(gb, zero_run);
}
|
|
|
/**
 * Parse the colour configuration part of a sequence header.
 *
 * Reads from gb and fills bitdepth, monochrome,
 * color_description_present_flag, color_primaries,
 * transfer_characteristics, matrix_coefficients, color_range,
 * chroma_subsampling_x/y and (where coded) chroma_sample_position in
 * seq_params. seq_params->profile must already be set, since it selects
 * which fields are coded.
 *
 * @param seq_params sequence parameters to update
 * @param gb         bit reader positioned at the start of the colour config
 * @return always 0
 */
static int parse_color_config(AV1SequenceParameters *seq_params, GetBitContext *gb)
{
    int twelve_bit = 0;
    int high_bitdepth = get_bits1(gb);

    if (seq_params->profile == AV_PROFILE_AV1_PROFESSIONAL && high_bitdepth)
        twelve_bit = get_bits1(gb);

    /* 8, 10 or 12 bits. */
    seq_params->bitdepth = 8 + (high_bitdepth * 2) + (twelve_bit * 2);

    if (seq_params->profile == AV_PROFILE_AV1_HIGH)
        seq_params->monochrome = 0;
    else
        seq_params->monochrome = get_bits1(gb);

    seq_params->color_description_present_flag = get_bits1(gb);
    if (seq_params->color_description_present_flag) {
        seq_params->color_primaries          = get_bits(gb, 8);
        seq_params->transfer_characteristics = get_bits(gb, 8);
        seq_params->matrix_coefficients      = get_bits(gb, 8);
    } else {
        seq_params->color_primaries          = AVCOL_PRI_UNSPECIFIED;
        seq_params->transfer_characteristics = AVCOL_TRC_UNSPECIFIED;
        seq_params->matrix_coefficients      = AVCOL_SPC_UNSPECIFIED;
    }

    if (seq_params->monochrome) {
        seq_params->color_range            = get_bits1(gb);
        seq_params->chroma_subsampling_x   = 1;
        seq_params->chroma_subsampling_y   = 1;
        seq_params->chroma_sample_position = 0;
        /* Return before the separate_uv_delta_q bit below is skipped. */
        return 0;
    } else if (seq_params->color_primaries          == AVCOL_PRI_BT709 &&
               seq_params->transfer_characteristics == AVCOL_TRC_IEC61966_2_1 &&
               seq_params->matrix_coefficients      == AVCOL_SPC_RGB) {
        /* sRGB: color_range is not coded; the AV1 specification infers it
         * as 1 (full range) rather than leaving it at 0. */
        seq_params->color_range          = 1;
        seq_params->chroma_subsampling_x = 0;
        seq_params->chroma_subsampling_y = 0;
    } else {
        seq_params->color_range = get_bits1(gb);

        if (seq_params->profile == AV_PROFILE_AV1_MAIN) {
            seq_params->chroma_subsampling_x = 1;
            seq_params->chroma_subsampling_y = 1;
        } else if (seq_params->profile == AV_PROFILE_AV1_HIGH) {
            seq_params->chroma_subsampling_x = 0;
            seq_params->chroma_subsampling_y = 0;
        } else {
            if (twelve_bit) {
                /* Only 12-bit content codes its subsampling explicitly. */
                seq_params->chroma_subsampling_x = get_bits1(gb);
                if (seq_params->chroma_subsampling_x)
                    seq_params->chroma_subsampling_y = get_bits1(gb);
                else
                    seq_params->chroma_subsampling_y = 0;
            } else {
                seq_params->chroma_subsampling_x = 1;
                seq_params->chroma_subsampling_y = 0;
            }
        }
        if (seq_params->chroma_subsampling_x && seq_params->chroma_subsampling_y)
            seq_params->chroma_sample_position = get_bits(gb, 2);
    }

    skip_bits1(gb); // separate_uv_delta_q

    return 0;
}
|
|
|
/**
 * Parse a sequence header OBU payload into seq_params.
 *
 * seq_params is zeroed first; profile, level and tier are then read
 * directly, and the colour-related fields are filled by
 * parse_color_config(). All other syntax elements are only skipped. Level
 * and tier are taken from the first operating point.
 *
 * @param seq_params destination, fully overwritten
 * @param buf        start of the data handed to get_obu_bit_length()
 * @param size       number of bytes at buf
 * @return 0 on success; a negative value from get_obu_bit_length() or
 *         init_get_bits(); AVERROR_INVALIDDATA if the reader does not end
 *         exactly at the bit length reported by get_obu_bit_length()
 */
static int parse_sequence_header(AV1SequenceParameters *seq_params, const uint8_t *buf, int size)
{
    GetBitContext gb;
    int reduced_still_picture_header;
    int width_bits_minus_1, height_bits_minus_1;
    int nb_bits, err;

    nb_bits = get_obu_bit_length(buf, size, AV1_OBU_SEQUENCE_HEADER);
    if (nb_bits < 0)
        return nb_bits;

    err = init_get_bits(&gb, buf, nb_bits);
    if (err < 0)
        return err;

    memset(seq_params, 0, sizeof(*seq_params));

    seq_params->profile = get_bits(&gb, 3);

    skip_bits1(&gb); // still_picture
    reduced_still_picture_header = get_bits1(&gb);

    if (reduced_still_picture_header) {
        seq_params->level = get_bits(&gb, 5);
        seq_params->tier  = 0;
    } else {
        int decoder_model_info_present_flag = 0;
        int buffer_delay_length_minus_1     = 0;
        int initial_display_delay_present_flag;
        int operating_points_cnt_minus_1;

        if (get_bits1(&gb)) { // timing_info_present_flag
            skip_bits_long(&gb, 32); // num_units_in_display_tick
            skip_bits_long(&gb, 32); // time_scale

            if (get_bits1(&gb)) { // equal_picture_interval
                uvlc(&gb); // num_ticks_per_picture_minus_1
            }

            decoder_model_info_present_flag = get_bits1(&gb);
            if (decoder_model_info_present_flag) {
                buffer_delay_length_minus_1 = get_bits(&gb, 5);
                skip_bits_long(&gb, 32); // num_units_in_decoding_tick
                skip_bits(&gb, 10);      // buffer_removal_time_length_minus_1 (5)
                                         // frame_presentation_time_length_minus_1 (5)
            }
        }

        initial_display_delay_present_flag = get_bits1(&gb);

        operating_points_cnt_minus_1 = get_bits(&gb, 5);
        for (int i = 0; i <= operating_points_cnt_minus_1; i++) {
            int seq_level_idx, seq_tier;

            skip_bits(&gb, 12); // operating_point_idc
            seq_level_idx = get_bits(&gb, 5);

            /* The tier bit is only coded for level indices above 7. */
            seq_tier = seq_level_idx > 7 ? get_bits1(&gb) : 0;

            if (decoder_model_info_present_flag &&
                get_bits1(&gb)) { // decoder_model_present_for_this_op
                skip_bits_long(&gb, buffer_delay_length_minus_1 + 1); // decoder_buffer_delay
                skip_bits_long(&gb, buffer_delay_length_minus_1 + 1); // encoder_buffer_delay
                skip_bits1(&gb);                                      // low_delay_mode_flag
            }

            if (initial_display_delay_present_flag &&
                get_bits1(&gb)) { // initial_display_delay_present_for_this_op
                skip_bits(&gb, 4); // initial_display_delay_minus_1
            }

            /* Only the first operating point is reported. */
            if (!i) {
                seq_params->level = seq_level_idx;
                seq_params->tier  = seq_tier;
            }
        }
    }

    width_bits_minus_1  = get_bits(&gb, 4); // frame_width_bits_minus_1
    height_bits_minus_1 = get_bits(&gb, 4); // frame_height_bits_minus_1

    skip_bits(&gb, width_bits_minus_1 + 1);  // max_frame_width_minus_1
    skip_bits(&gb, height_bits_minus_1 + 1); // max_frame_height_minus_1

    if (!reduced_still_picture_header && get_bits1(&gb)) { // frame_id_numbers_present_flag
        skip_bits(&gb, 7); // delta_frame_id_length_minus_2 (4), additional_frame_id_length_minus_1 (3)
    }

    skip_bits(&gb, 3); // use_128x128_superblock (1), enable_filter_intra (1), enable_intra_edge_filter (1)

    if (!reduced_still_picture_header) {
        int enable_order_hint, seq_force_screen_content_tools;

        skip_bits(&gb, 4); // enable_interintra_compound (1), enable_masked_compound (1)
                           // enable_warped_motion (1), enable_dual_filter (1)

        enable_order_hint = get_bits1(&gb);
        if (enable_order_hint) {
            skip_bits(&gb, 2); // enable_jnt_comp (1), enable_ref_frame_mvs (1)
        }

        if (get_bits1(&gb)) { // seq_choose_screen_content_tools
            seq_force_screen_content_tools = 2;
        } else {
            seq_force_screen_content_tools = get_bits1(&gb);
        }

        if (seq_force_screen_content_tools &&
            !get_bits1(&gb)) { // seq_choose_integer_mv
            skip_bits1(&gb); // seq_force_integer_mv
        }

        if (enable_order_hint) {
            skip_bits(&gb, 3); // order_hint_bits_minus_1
        }
    }

    skip_bits(&gb, 3); // enable_superres (1), enable_cdef (1), enable_restoration (1)

    parse_color_config(seq_params, &gb);

    skip_bits1(&gb); // film_grain_params_present

    /* Any non-zero remainder means the header was not consumed exactly. */
    return get_bits_left(&gb) ? AVERROR_INVALIDDATA : 0;
}
|
|
|
/**
 * Extract sequence parameters from either raw OBUs or data that starts
 * with a 4-byte header whose first byte has its top bit set.
 *
 * With such a header (version 1 required), seq is zeroed and filled from
 * the header fields, with the colour description set to "unspecified";
 * the OBUs after the header are then scanned. In both cases, the first
 * sequence header OBU found is parsed with parse_sequence_header() and its
 * result returned immediately.
 *
 * @param seq  destination for the parsed parameters
 * @param buf  input data
 * @param size number of bytes at buf
 * @return 0 on success (including header-only data with no sequence header
 *         OBU); AVERROR_INVALIDDATA for empty input, a bad or truncated
 *         header, a sequence header OBU with zero size, or raw OBU data
 *         without any sequence header; otherwise the negative value from
 *         parse_obu_header(), init_get_bits8() or parse_sequence_header()
 */
int ff_av1_parse_seq_header(AV1SequenceParameters *seq, const uint8_t *buf, int size)
{
    int has_config_header;

    if (size <= 0)
        return AVERROR_INVALIDDATA;

    has_config_header = (buf[0] & 0x80) != 0;
    if (has_config_header) {
        GetBitContext gb;
        int high_bitdepth, twelve_bit;
        int err;

        if ((buf[0] & 0x7F) != 1 || size < 4)
            return AVERROR_INVALIDDATA;

        err = init_get_bits8(&gb, buf, 4);
        if (err < 0)
            return err;

        memset(seq, 0, sizeof(*seq));

        skip_bits(&gb, 8); /* marker and version, checked above */
        seq->profile = get_bits(&gb, 3);
        seq->level   = get_bits(&gb, 5);
        seq->tier    = get_bits(&gb, 1);

        high_bitdepth = get_bits(&gb, 1);
        twelve_bit    = get_bits(&gb, 1);
        seq->bitdepth = high_bitdepth * 2 + 8;
        seq->bitdepth += twelve_bit * 2;

        seq->monochrome             = get_bits(&gb, 1);
        seq->chroma_subsampling_x   = get_bits(&gb, 1);
        seq->chroma_subsampling_y   = get_bits(&gb, 1);
        seq->chroma_sample_position = get_bits(&gb, 2);

        /* The header carries no colour description. */
        seq->color_primaries          = AVCOL_PRI_UNSPECIFIED;
        seq->transfer_characteristics = AVCOL_TRC_UNSPECIFIED;
        seq->matrix_coefficients      = AVCOL_SPC_UNSPECIFIED;

        buf  += 4;
        size -= 4;
    }

    while (size > 0) {
        int64_t obu_size;
        int start_pos, type, temporal_id, spatial_id;
        int len = parse_obu_header(buf, size, &obu_size, &start_pos,
                                   &type, &temporal_id, &spatial_id);
        if (len < 0)
            return len;

        if (type == AV1_OBU_SEQUENCE_HEADER) {
            if (!obu_size)
                return AVERROR_INVALIDDATA;

            return parse_sequence_header(seq, buf + start_pos, obu_size);
        }

        buf  += len;
        size -= len;
    }

    /* No sequence header OBU: acceptable only if the header filled seq. */
    return has_config_header ? 0 : AVERROR_INVALIDDATA;
}
|
|
|
/**
 * Write an AV1CodecConfigurationRecord to pb.
 *
 * If the first input byte has its top bit set, the data is expected to be
 * such a record already (version 1, at least 4 bytes) and is copied to pb
 * unchanged. Otherwise the input is scanned as OBUs: exactly one sequence
 * header OBU is required and parsed, metadata OBUs are collected, and all
 * other OBUs are ignored. The output is a 4-byte header built from the
 * parsed sequence parameters, optionally the sequence header OBU itself,
 * then the collected metadata OBUs.
 *
 * @param pb               destination
 * @param buf              input data
 * @param size             number of bytes at buf
 * @param write_seq_header if non-zero, the sequence header OBU is written
 *                         after the 4-byte header
 * @return 0 on success; AVERROR_INVALIDDATA for empty input, a bad record
 *         version or length, a zero-sized sequence header or metadata OBU,
 *         more than one or no sequence header; otherwise the negative value
 *         from avio_open_dyn_buf(), parse_obu_header() or
 *         parse_sequence_header()
 */
int ff_isom_write_av1c(AVIOContext *pb, const uint8_t *buf, int size,
                       int write_seq_header)
{
    AVIOContext *meta_pb;
    AV1SequenceParameters seq_params;
    PutBitContext pbc;
    uint8_t header[4], *meta;
    const uint8_t *seq_obu = NULL;
    int seq_obu_size = 0;
    int nb_seq = 0;
    int meta_size;
    int ret;

    if (size <= 0)
        return AVERROR_INVALIDDATA;

    if (buf[0] & 0x80) {
        // first bit is nonzero, the passed data does not consist purely of
        // OBUs. Expect that the data is already in AV1CodecConfigurationRecord
        // format.
        if ((buf[0] & 0x7f) != 1 || size < 4)
            return AVERROR_INVALIDDATA;

        avio_write(pb, buf, size);

        return 0;
    }

    ret = avio_open_dyn_buf(&meta_pb);
    if (ret < 0)
        return ret;

    while (size > 0) {
        int64_t obu_size;
        int start_pos, type, temporal_id, spatial_id;
        int len = parse_obu_header(buf, size, &obu_size, &start_pos,
                                   &type, &temporal_id, &spatial_id);
        if (len < 0) {
            ret = len;
            goto fail;
        }

        if (type == AV1_OBU_SEQUENCE_HEADER) {
            nb_seq++;
            /* Reject an empty or a second sequence header. */
            if (!obu_size || nb_seq > 1) {
                ret = AVERROR_INVALIDDATA;
                goto fail;
            }

            ret = parse_sequence_header(&seq_params, buf + start_pos, obu_size);
            if (ret < 0)
                goto fail;

            /* Remember the whole OBU, header included. */
            seq_obu      = buf;
            seq_obu_size = len;
        } else if (type == AV1_OBU_METADATA) {
            if (!obu_size) {
                ret = AVERROR_INVALIDDATA;
                goto fail;
            }
            avio_write(meta_pb, buf, len);
        }

        buf  += len;
        size -= len;
    }

    if (!nb_seq) {
        ret = AVERROR_INVALIDDATA;
        goto fail;
    }

    init_put_bits(&pbc, header, sizeof(header));

    put_bits(&pbc, 1, 1); // marker
    put_bits(&pbc, 7, 1); // version
    put_bits(&pbc, 3, seq_params.profile);
    put_bits(&pbc, 5, seq_params.level);
    put_bits(&pbc, 1, seq_params.tier);
    put_bits(&pbc, 1, seq_params.bitdepth > 8);
    put_bits(&pbc, 1, seq_params.bitdepth == 12);
    put_bits(&pbc, 1, seq_params.monochrome);
    put_bits(&pbc, 1, seq_params.chroma_subsampling_x);
    put_bits(&pbc, 1, seq_params.chroma_subsampling_y);
    put_bits(&pbc, 2, seq_params.chroma_sample_position);
    put_bits(&pbc, 8, 0); // padding
    flush_put_bits(&pbc);

    avio_write(pb, header, sizeof(header));
    if (write_seq_header)
        avio_write(pb, seq_obu, seq_obu_size);

    meta_size = avio_get_dyn_buf(meta_pb, &meta);
    if (meta_size)
        avio_write(pb, meta, meta_size);

    /* Success falls through: ret is still 0 from parse_sequence_header(). */
fail:
    ffio_free_dyn_buf(&meta_pb);

    return ret;
}
|
|
|