mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
318 lines
10 KiB
318 lines
10 KiB
/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
#include "libavutil/common.h" |
|
#include "libavutil/opt.h" |
|
|
|
#include "bsf.h" |
|
#include "cbs.h" |
|
#include "cbs_av1.h" |
|
|
|
/* Values accepted by the "td" option (handling of the Temporal Delimiter). */
enum {
    PASS   = 0, /* leave the packet's Temporal Delimiter state as it is */
    INSERT = 1, /* add a Temporal Delimiter when the packet does not start with one */
    REMOVE = 2, /* drop a Temporal Delimiter found as the first OBU */
};
|
|
|
typedef struct AV1MetadataContext { |
|
const AVClass *class; |
|
|
|
CodedBitstreamContext *cbc; |
|
CodedBitstreamFragment access_unit; |
|
|
|
int td; |
|
|
|
int color_primaries; |
|
int transfer_characteristics; |
|
int matrix_coefficients; |
|
|
|
int color_range; |
|
int chroma_sample_position; |
|
|
|
AVRational tick_rate; |
|
int num_ticks_per_picture; |
|
|
|
int delete_padding; |
|
} AV1MetadataContext; |
|
|
|
|
|
static int av1_metadata_update_sequence_header(AVBSFContext *bsf, |
|
AV1RawSequenceHeader *seq) |
|
{ |
|
AV1MetadataContext *ctx = bsf->priv_data; |
|
AV1RawColorConfig *clc = &seq->color_config; |
|
AV1RawTimingInfo *tim = &seq->timing_info; |
|
|
|
if (ctx->color_primaries >= 0 || |
|
ctx->transfer_characteristics >= 0 || |
|
ctx->matrix_coefficients >= 0) { |
|
if (!clc->color_description_present_flag) { |
|
clc->color_description_present_flag = 1; |
|
clc->color_primaries = AVCOL_PRI_UNSPECIFIED; |
|
clc->transfer_characteristics = AVCOL_TRC_UNSPECIFIED; |
|
clc->matrix_coefficients = AVCOL_SPC_UNSPECIFIED; |
|
} |
|
|
|
if (ctx->color_primaries >= 0) |
|
clc->color_primaries = ctx->color_primaries; |
|
if (ctx->transfer_characteristics >= 0) |
|
clc->transfer_characteristics = ctx->transfer_characteristics; |
|
if (ctx->matrix_coefficients >= 0) |
|
clc->matrix_coefficients = ctx->matrix_coefficients; |
|
} |
|
|
|
if (ctx->color_range >= 0) { |
|
if (clc->color_primaries == AVCOL_PRI_BT709 && |
|
clc->transfer_characteristics == AVCOL_TRC_IEC61966_2_1 && |
|
clc->matrix_coefficients == AVCOL_SPC_RGB) { |
|
av_log(bsf, AV_LOG_WARNING, "Warning: color_range cannot be set " |
|
"on RGB streams encoded in BT.709 sRGB.\n"); |
|
} else { |
|
clc->color_range = ctx->color_range; |
|
} |
|
} |
|
|
|
if (ctx->chroma_sample_position >= 0) { |
|
if (clc->mono_chrome || !clc->subsampling_x || !clc->subsampling_y) { |
|
av_log(bsf, AV_LOG_WARNING, "Warning: chroma_sample_position " |
|
"can only be set for 4:2:0 streams.\n"); |
|
} else { |
|
clc->chroma_sample_position = ctx->chroma_sample_position; |
|
} |
|
} |
|
|
|
if (ctx->tick_rate.num && ctx->tick_rate.den) { |
|
int num, den; |
|
|
|
av_reduce(&num, &den, ctx->tick_rate.num, ctx->tick_rate.den, |
|
UINT32_MAX > INT_MAX ? UINT32_MAX : INT_MAX); |
|
|
|
tim->time_scale = num; |
|
tim->num_units_in_display_tick = den; |
|
seq->timing_info_present_flag = 1; |
|
|
|
if (ctx->num_ticks_per_picture > 0) { |
|
tim->equal_picture_interval = 1; |
|
tim->num_ticks_per_picture_minus_1 = |
|
ctx->num_ticks_per_picture - 1; |
|
} |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
/**
 * Filter callback: rewrite one packet according to the configured options.
 *
 * Steps, in order:
 *  1. fetch the next input packet and parse it into OBUs;
 *  2. apply the sequence header overrides to every Sequence Header OBU;
 *  3. insert or remove the leading Temporal Delimiter as requested by "td";
 *  4. optionally delete every Padding OBU;
 *  5. serialise the fragment back into the packet.
 *
 * @param bsf  filter context
 * @param pkt  packet that receives the filtered output
 * @return 0 on success, a negative error code on failure; on failure the
 *         packet is unreferenced. The fragment is reset in both cases.
 */
static int av1_metadata_filter(AVBSFContext *bsf, AVPacket *pkt)
{
    AV1MetadataContext *ctx = bsf->priv_data;
    CodedBitstreamFragment *frag = &ctx->access_unit;
    AV1RawOBU td, *obu;
    int err, i;

    /* Nothing has been parsed yet, so there is nothing to clean up here. */
    err = ff_bsf_get_packet_ref(bsf, pkt);
    if (err < 0)
        return err;

    err = ff_cbs_read_packet(ctx->cbc, frag, pkt);
    if (err < 0) {
        av_log(bsf, AV_LOG_ERROR, "Failed to read packet.\n");
        goto fail;
    }

    /* The code below indexes units[0], so an empty fragment is rejected. */
    if (frag->nb_units == 0) {
        av_log(bsf, AV_LOG_ERROR, "No OBU in packet.\n");
        err = AVERROR_INVALIDDATA;
        goto fail;
    }

    for (i = 0; i < frag->nb_units; i++) {
        if (frag->units[i].type == AV1_OBU_SEQUENCE_HEADER) {
            obu = frag->units[i].content;
            err = av1_metadata_update_sequence_header(bsf, &obu->obu.sequence_header);
            if (err < 0)
                goto fail;
        }
    }

    // If a Temporal Delimiter is present, it must be the first OBU.
    if (frag->units[0].type == AV1_OBU_TEMPORAL_DELIMITER) {
        if (ctx->td == REMOVE) {
            /* Checked like the Padding OBU deletion below, so a failure
             * is reported instead of being silently ignored. */
            err = ff_cbs_delete_unit(ctx->cbc, frag, 0);
            if (err < 0) {
                av_log(bsf, AV_LOG_ERROR, "Failed to delete Temporal Delimiter.\n");
                goto fail;
            }
        }
    } else if (ctx->td == INSERT) {
        /* td lives on the stack; it is only referenced by the fragment
         * until the fragment is reset at the end of this function. */
        td = (AV1RawOBU) {
            .header.obu_type = AV1_OBU_TEMPORAL_DELIMITER,
        };

        err = ff_cbs_insert_unit_content(ctx->cbc, frag, 0, AV1_OBU_TEMPORAL_DELIMITER,
                                         &td, NULL);
        if (err < 0) {
            av_log(bsf, AV_LOG_ERROR, "Failed to insert Temporal Delimiter.\n");
            goto fail;
        }
    }

    if (ctx->delete_padding) {
        /* Walk backwards so deleting a unit does not shift the indices
         * that are still to be visited. */
        for (i = frag->nb_units - 1; i >= 0; i--) {
            if (frag->units[i].type == AV1_OBU_PADDING) {
                err = ff_cbs_delete_unit(ctx->cbc, frag, i);
                if (err < 0) {
                    av_log(bsf, AV_LOG_ERROR, "Failed to delete Padding OBU.\n");
                    goto fail;
                }
            }
        }
    }

    err = ff_cbs_write_packet(ctx->cbc, pkt, frag);
    if (err < 0) {
        av_log(bsf, AV_LOG_ERROR, "Failed to write packet.\n");
        goto fail;
    }

    err = 0;
fail:
    /* Reached on success as well: the fragment is reused for the next packet. */
    ff_cbs_fragment_reset(ctx->cbc, frag);

    if (err < 0)
        av_packet_unref(pkt);

    return err;
}
|
|
|
/**
 * Init callback: create the CBS context and, when the input parameters
 * carry extradata, rewrite it with the requested sequence header overrides.
 *
 * @param bsf  filter context
 * @return 0 on success, a negative error code on failure
 */
static int av1_metadata_init(AVBSFContext *bsf)
{
    AV1MetadataContext *ctx = bsf->priv_data;
    CodedBitstreamFragment *frag = &ctx->access_unit;
    int ret, idx;

    ret = ff_cbs_init(&ctx->cbc, AV_CODEC_ID_AV1, bsf);
    if (ret < 0)
        return ret;

    if (bsf->par_in->extradata) {
        ret = ff_cbs_read_extradata(ctx->cbc, frag, bsf->par_in);
        if (ret < 0) {
            av_log(bsf, AV_LOG_ERROR, "Failed to read extradata.\n");
            goto end;
        }

        /* Patch every sequence header found in the extradata. */
        for (idx = 0; idx < frag->nb_units; idx++) {
            AV1RawOBU *obu;

            if (frag->units[idx].type != AV1_OBU_SEQUENCE_HEADER)
                continue;

            obu = frag->units[idx].content;
            ret = av1_metadata_update_sequence_header(bsf, &obu->obu.sequence_header);
            if (ret < 0)
                goto end;
        }

        /* The modified extradata goes to the output parameters. */
        ret = ff_cbs_write_extradata(ctx->cbc, bsf->par_out, frag);
        if (ret < 0) {
            av_log(bsf, AV_LOG_ERROR, "Failed to write extradata.\n");
            goto end;
        }
    }

    ret = 0;
end:
    /* Runs on every path past ff_cbs_init(), success included. */
    ff_cbs_fragment_reset(ctx->cbc, frag);
    return ret;
}
|
|
|
/**
 * Close callback: free the reusable fragment, then close the CBS context.
 *
 * @param bsf  filter context whose private data is being torn down
 */
static void av1_metadata_close(AVBSFContext *bsf)
{
    AV1MetadataContext *priv = bsf->priv_data;

    /* The fragment is freed first, while the CBS context is still open. */
    ff_cbs_fragment_free(priv->cbc, &priv->access_unit);
    ff_cbs_close(&priv->cbc);
}
|
|
|
#define OFFSET(x) offsetof(AV1MetadataContext, x) |
|
#define FLAGS (AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_BSF_PARAM) |
|
static const AVOption av1_metadata_options[] = { |
|
{ "td", "Temporal Delimiter OBU", |
|
OFFSET(td), AV_OPT_TYPE_INT, |
|
{ .i64 = PASS }, PASS, REMOVE, FLAGS, "td" }, |
|
{ "pass", NULL, 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = PASS }, .flags = FLAGS, .unit = "td" }, |
|
{ "insert", NULL, 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = INSERT }, .flags = FLAGS, .unit = "td" }, |
|
{ "remove", NULL, 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = REMOVE }, .flags = FLAGS, .unit = "td" }, |
|
|
|
{ "color_primaries", "Set color primaries (section 6.4.2)", |
|
OFFSET(color_primaries), AV_OPT_TYPE_INT, |
|
{ .i64 = -1 }, -1, 255, FLAGS }, |
|
{ "transfer_characteristics", "Set transfer characteristics (section 6.4.2)", |
|
OFFSET(transfer_characteristics), AV_OPT_TYPE_INT, |
|
{ .i64 = -1 }, -1, 255, FLAGS }, |
|
{ "matrix_coefficients", "Set matrix coefficients (section 6.4.2)", |
|
OFFSET(matrix_coefficients), AV_OPT_TYPE_INT, |
|
{ .i64 = -1 }, -1, 255, FLAGS }, |
|
|
|
{ "color_range", "Set color range flag (section 6.4.2)", |
|
OFFSET(color_range), AV_OPT_TYPE_INT, |
|
{ .i64 = -1 }, -1, 1, FLAGS, "cr" }, |
|
{ "tv", "TV (limited) range", 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = 0 }, .flags = FLAGS, .unit = "cr" }, |
|
{ "pc", "PC (full) range", 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = 1 }, .flags = FLAGS, .unit = "cr" }, |
|
|
|
{ "chroma_sample_position", "Set chroma sample position (section 6.4.2)", |
|
OFFSET(chroma_sample_position), AV_OPT_TYPE_INT, |
|
{ .i64 = -1 }, -1, 3, FLAGS, "csp" }, |
|
{ "unknown", "Unknown chroma sample position", 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = AV1_CSP_UNKNOWN }, .flags = FLAGS, .unit = "csp" }, |
|
{ "vertical", "Left chroma sample position", 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = AV1_CSP_VERTICAL }, .flags = FLAGS, .unit = "csp" }, |
|
{ "colocated", "Top-left chroma sample position", 0, AV_OPT_TYPE_CONST, |
|
{ .i64 = AV1_CSP_COLOCATED }, .flags = FLAGS, .unit = "csp" }, |
|
|
|
{ "tick_rate", "Set display tick rate (num_units_in_display_tick / time_scale)", |
|
OFFSET(tick_rate), AV_OPT_TYPE_RATIONAL, |
|
{ .dbl = 0.0 }, 0, UINT_MAX, FLAGS }, |
|
{ "num_ticks_per_picture", "Set display ticks per picture for CFR streams", |
|
OFFSET(num_ticks_per_picture), AV_OPT_TYPE_INT, |
|
{ .i64 = -1 }, -1, INT_MAX, FLAGS }, |
|
|
|
{ "delete_padding", "Delete all Padding OBUs", |
|
OFFSET(delete_padding), AV_OPT_TYPE_BOOL, |
|
{ .i64 = 0 }, 0, 1, FLAGS}, |
|
|
|
{ NULL } |
|
}; |
|
|
|
static const AVClass av1_metadata_class = { |
|
.class_name = "av1_metadata_bsf", |
|
.item_name = av_default_item_name, |
|
.option = av1_metadata_options, |
|
.version = LIBAVUTIL_VERSION_INT, |
|
}; |
|
|
|
static const enum AVCodecID av1_metadata_codec_ids[] = { |
|
AV_CODEC_ID_AV1, AV_CODEC_ID_NONE, |
|
}; |
|
|
|
const AVBitStreamFilter ff_av1_metadata_bsf = { |
|
.name = "av1_metadata", |
|
.priv_data_size = sizeof(AV1MetadataContext), |
|
.priv_class = &av1_metadata_class, |
|
.init = &av1_metadata_init, |
|
.close = &av1_metadata_close, |
|
.filter = &av1_metadata_filter, |
|
.codec_ids = av1_metadata_codec_ids, |
|
};
|
|
|