/* Retrieved from a mirror of https://github.com/FFmpeg/FFmpeg.git (491 lines, 17 KiB). */
/*
 * H.266 encoding using the VVenC library
 *
 * Copyright (C) 2022, Thomas Siedel
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
#include <vvenc/vvenc.h> |
|
#include <vvenc/vvencCfg.h> |
|
#include <vvenc/version.h> |
|
|
|
#include "libavutil/avstring.h" |
|
#include "libavutil/avutil.h" |
|
#include "libavutil/common.h" |
|
#include "libavutil/frame.h" |
|
#include "libavutil/imgutils.h" |
|
#include "libavutil/log.h" |
|
#include "libavutil/mem.h" |
|
#include "libavutil/pixdesc.h" |
|
#include "libavutil/opt.h" |
|
|
|
#include "avcodec.h" |
|
#include "codec_internal.h" |
|
#include "encode.h" |
|
#include "internal.h" |
|
#include "packet_internal.h" |
|
#include "profiles.h" |
|
|
|
/* libvvenc version packed with AV_VERSION_INT() so that it can be compared
 * against AV_VERSION_INT(major, minor, patch) in preprocessor conditions. */
#define VVENC_VERSION_INT AV_VERSION_INT(VVENC_VERSION_MAJOR, \
                                         VVENC_VERSION_MINOR, \
                                         VVENC_VERSION_PATCH)
|
|
|
typedef struct VVenCContext { |
|
AVClass *class; |
|
vvencEncoder *encoder; |
|
vvencAccessUnit *au; |
|
bool encode_done; |
|
int preset; |
|
int qp; |
|
int qpa; |
|
int intra_refresh_sec; |
|
char *level; |
|
int tier; |
|
char *stats; |
|
AVDictionary *vvenc_opts; |
|
} VVenCContext; |
|
|
|
static void vvenc_log_callback(void *ctx, int level, |
|
const char *fmt, va_list args) |
|
{ |
|
vvenc_config params; |
|
vvencEncoder *encoder = ctx; |
|
if (encoder) { |
|
vvenc_config_default(¶ms); |
|
vvenc_get_config(encoder, ¶ms); |
|
if ((int)params.m_verbosity >= level) |
|
vfprintf(level == 1 ? stderr : stdout, fmt, args); |
|
} |
|
} |
|
|
|
/**
 * Derive the libvvenc verbosity from FFmpeg's global log level.
 *
 * Mapping (first match wins):
 *   >= AV_LOG_DEBUG   -> VVENC_DETAILS
 *   >= AV_LOG_VERBOSE -> VVENC_NOTICE
 *   >= AV_LOG_INFO    -> VVENC_WARNING
 *   otherwise         -> VVENC_SILENT
 *
 * @param params configuration whose m_verbosity field is overwritten
 */
static void vvenc_set_verbository(vvenc_config *params)
{
    int loglevel = av_log_get_level();

    params->m_verbosity = VVENC_SILENT;
    if (loglevel >= AV_LOG_DEBUG)
        params->m_verbosity = VVENC_DETAILS;
    else if (loglevel >= AV_LOG_VERBOSE)
        params->m_verbosity = VVENC_NOTICE;
    else if (loglevel >= AV_LOG_INFO)
        params->m_verbosity = VVENC_WARNING;
}
|
|
|
/**
 * Set the picture format in the encoder configuration.
 *
 * The values are fixed: 4:2:0 chroma and an input bit depth of 10 for
 * index 0 of m_inputBitDepth. This matches the only pixel format the
 * wrapper advertises (AV_PIX_FMT_YUV420P10).
 *
 * @param avctx  codec context (currently not read)
 * @param params configuration to update
 */
static void vvenc_set_pic_format(AVCodecContext *avctx, vvenc_config *params)
{
    params->m_internChromaFormat = VVENC_CHROMA_420;
    params->m_inputBitDepth[0]   = 10;
}
|
|
|
/**
 * Transfer colour description and HDR signalling from the codec context
 * to the encoder configuration.
 *
 * - Primaries, matrix coefficients and transfer characteristics are copied
 *   whenever the corresponding AVCodecContext field is not "unspecified".
 * - SMPTE 2084 transfer selects a PQ HDR mode (the BT.2020 variant when the
 *   primaries are BT.2020).
 * - BT.2020 10-bit or ARIB STD-B67 transfer selects an HLG HDR mode (the
 *   BT.2020 variant when the transfer is BT.2020 10-bit, or the primaries
 *   or the colorspace are BT.2020).
 * - If HDR mode is off and primaries or colorspace are specified, the VUI
 *   with colour description is enabled.
 *
 * m_HdrMode is only written for the transfer characteristics listed above;
 * otherwise the value already present in params is used for the final check.
 *
 * @param avctx  codec context providing the colour properties
 * @param params configuration to update
 */
static void vvenc_set_color_format(AVCodecContext *avctx, vvenc_config *params)
{
    if (avctx->color_primaries != AVCOL_PRI_UNSPECIFIED)
        params->m_colourPrimaries = (int) avctx->color_primaries;
    if (avctx->colorspace != AVCOL_SPC_UNSPECIFIED)
        params->m_matrixCoefficients = (int) avctx->colorspace;
    if (avctx->color_trc != AVCOL_TRC_UNSPECIFIED) {
        params->m_transferCharacteristics = (int) avctx->color_trc;

        if (avctx->color_trc == AVCOL_TRC_SMPTE2084)
            params->m_HdrMode = (avctx->color_primaries == AVCOL_PRI_BT2020) ?
                VVENC_HDR_PQ_BT2020 : VVENC_HDR_PQ;
        else if (avctx->color_trc == AVCOL_TRC_BT2020_10 || avctx->color_trc == AVCOL_TRC_ARIB_STD_B67)
            params->m_HdrMode = (avctx->color_trc == AVCOL_TRC_BT2020_10 ||
                                 avctx->color_primaries == AVCOL_PRI_BT2020 ||
                                 avctx->colorspace == AVCOL_SPC_BT2020_NCL ||
                                 avctx->colorspace == AVCOL_SPC_BT2020_CL) ?
                VVENC_HDR_HLG_BT2020 : VVENC_HDR_HLG;
    }

    /* Without an HDR mode, the colour description has to be requested
     * explicitly. */
    if (params->m_HdrMode == VVENC_HDR_OFF &&
        (avctx->color_primaries != AVCOL_PRI_UNSPECIFIED || avctx->colorspace != AVCOL_SPC_UNSPECIFIED)) {
        params->m_vuiParametersPresent = 1;
        params->m_colourDescriptionPresent = true;
    }
}
|
|
|
/**
 * Set frame rate, frame scale and ticks per second in the encoder
 * configuration.
 *
 * The frame rate is taken as a fraction from avctx->framerate when both of
 * its terms are positive, otherwise from the inverse of avctx->time_base.
 *
 * While FF_API_TICKS_PER_FRAME is enabled, m_TicksPerSecond is -1 ("auto")
 * for ticks_per_frame == 1 and ceil(ticks_per_frame / time_base) otherwise.
 * With the API disabled, only the unconditional assignment of -1 remains.
 *
 * @param avctx  codec context providing framerate / time_base
 * @param params configuration to update
 */
static void vvenc_set_framerate(AVCodecContext *avctx, vvenc_config *params)
{
    if (avctx->framerate.num > 0 && avctx->framerate.den > 0) {
        params->m_FrameRate  = avctx->framerate.num;
        params->m_FrameScale = avctx->framerate.den;
    } else {
        params->m_FrameRate  = avctx->time_base.den;
        params->m_FrameScale = avctx->time_base.num;
    }

FF_DISABLE_DEPRECATION_WARNINGS

#if FF_API_TICKS_PER_FRAME
    if (avctx->ticks_per_frame == 1) {
#endif
        params->m_TicksPerSecond = -1; /* auto mode for ticks per frame = 1 */
#if FF_API_TICKS_PER_FRAME
    } else {
        params->m_TicksPerSecond =
            ceil((avctx->time_base.den / (double) avctx->time_base.num) *
                 (double) avctx->ticks_per_frame);
    }
#endif
FF_ENABLE_DEPRECATION_WARNINGS
}
|
|
|
/**
 * Apply the user supplied "vvenc-params" dictionary to the configuration.
 *
 * Every entry is passed to vvenc_set_param(). Unknown names and invalid
 * values are logged. The two-pass related keys "rcstatsfile", "passes" and
 * "pass" are rejected because they have to be given through the wrapper's
 * own options. The loop does not stop at the first problem, so all
 * offending entries are reported.
 *
 * @param avctx  codec context (logging, private data)
 * @param params configuration to update
 * @return 0 on success, AVERROR(EINVAL) if at least one entry was rejected
 */
static int vvenc_parse_vvenc_params(AVCodecContext *avctx, vvenc_config *params)
{
    VVenCContext *s = avctx->priv_data;
    const AVDictionaryEntry *en = NULL;
    int parse_ret;
    int ret = 0;

    while ((en = av_dict_iterate(s->vvenc_opts, en))) {
        av_log(avctx, AV_LOG_DEBUG, "vvenc_set_param: '%s:%s'\n", en->key,
               en->value);
        parse_ret = vvenc_set_param(params, en->key, en->value);
        switch (parse_ret) {
        case VVENC_PARAM_BAD_NAME:
            av_log(avctx, AV_LOG_ERROR, "Unknown vvenc option: %s.\n", en->key);
            ret = AVERROR(EINVAL);
            break;
        case VVENC_PARAM_BAD_VALUE:
            av_log(avctx, AV_LOG_ERROR, "Invalid vvenc value for %s: %s.\n", en->key, en->value);
            ret = AVERROR(EINVAL);
            break;
        default:
            break;
        }

        /* Two-pass control is owned by the wrapper, not by vvenc-params. */
        if (!av_strcasecmp(en->key, "rcstatsfile")) {
            av_log(avctx, AV_LOG_ERROR, "vvenc-params 2pass option 'rcstatsfile' "
                   "not available. Use option 'passlogfile'\n");
            ret = AVERROR(EINVAL);
        }
        if (!av_strcasecmp(en->key, "passes") || !av_strcasecmp(en->key, "pass")) {
            av_log(avctx, AV_LOG_ERROR, "vvenc-params 2pass option '%s' "
                   "not available. Use option 'pass'\n", en->key);
            ret = AVERROR(EINVAL);
        }
    }
    return ret;
}
|
|
|
/**
 * Configure the rate control pass settings and the maximum bitrate.
 *
 * - Without pass flags a single pass is configured.
 * - With AV_CODEC_FLAG_PASS1 or AV_CODEC_FLAG_PASS2 two passes are
 *   configured and the current pass is selected; a target bitrate is
 *   mandatory in that case.
 * - rc_max_rate is forwarded only when building against libvvenc >= 1.8.0.
 *   When building against libvvenc < 1.11.0, rc_max_rate without a target
 *   bitrate (capped CQF) is rejected.
 *
 * @param avctx  codec context providing flags, bit_rate and rc_max_rate
 * @param params configuration to update
 * @return 0 on success, AVERROR(EINVAL) on an unsupported combination
 */
static int vvenc_set_rc_mode(AVCodecContext *avctx, vvenc_config *params)
{
    params->m_RCNumPasses = 1;
    if (avctx->flags & (AV_CODEC_FLAG_PASS1 | AV_CODEC_FLAG_PASS2)) {
        if (!avctx->bit_rate) {
            av_log(avctx, AV_LOG_ERROR, "A bitrate must be set to use two pass mode.\n");
            return AVERROR(EINVAL);
        }
        params->m_RCNumPasses = 2;
        /* PASS1 takes precedence if both flags happen to be set. */
        if (avctx->flags & AV_CODEC_FLAG_PASS1)
            params->m_RCPass = 1;
        else
            params->m_RCPass = 2;
    }

    if (avctx->rc_max_rate) {
#if VVENC_VERSION_INT >= AV_VERSION_INT(1,8,0)
        params->m_RCMaxBitrate = avctx->rc_max_rate;
#endif

#if VVENC_VERSION_INT < AV_VERSION_INT(1,11,0)
        /* rc_max_rate without a bit_rate enables capped CQF mode.
        (QP + subj. optimization + max. bitrate) */
        if (!avctx->bit_rate) {
            av_log(avctx, AV_LOG_ERROR, "Capped Constant Quality Factor mode (capped CQF) "
                   "needs at least vvenc version >= 1.11.0 (current version %s)\n", vvenc_get_version());
            return AVERROR(EINVAL);
        }
#endif
    }
    return 0;
}
|
|
|
/**
 * Fill avctx->extradata with the stream headers when global headers are
 * requested (AV_CODEC_FLAG_GLOBAL_HEADER); otherwise do nothing.
 *
 * The headers are written by vvenc_get_headers() into s->au and then copied
 * into a freshly allocated, zero-padded extradata buffer.
 *
 * @param avctx codec context receiving extradata / extradata_size
 * @param s     private context; encoder and au must already be set up
 * @return 0 on success,
 *         AVERROR(EINVAL) if the headers cannot be obtained,
 *         AVERROR_INVALIDDATA if the encoder returned no header bytes,
 *         AVERROR(ENOMEM) on allocation failure
 */
static int vvenc_init_extradata(AVCodecContext *avctx, VVenCContext *s)
{
    int ret;

    if (avctx->flags & AV_CODEC_FLAG_GLOBAL_HEADER) {
        ret = vvenc_get_headers(s->encoder, s->au);
        if (0 != ret) {
            av_log(avctx, AV_LOG_ERROR, "cannot get (SPS,PPS) headers: %s\n",
                   vvenc_get_last_error(s->encoder));
            return AVERROR(EINVAL);
        }

        if (s->au->payloadUsedSize <= 0) {
            return AVERROR_INVALIDDATA;
        }

        avctx->extradata_size = s->au->payloadUsedSize;
        /* Zeroed allocation, so the padding after the headers is cleared. */
        avctx->extradata = av_mallocz(avctx->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
        if (!avctx->extradata) {
            return AVERROR(ENOMEM);
        }

        memcpy(avctx->extradata, s->au->payload, avctx->extradata_size);
    }
    return 0;
}
|
|
|
/**
 * Encoder init callback: build the libvvenc configuration from the codec
 * context and the private options, open the encoder, and allocate the
 * access unit used as output buffer.
 *
 * Order of operations:
 *   1. reject interlaced encoding
 *   2. defaults + vvenc_init_default() with size, frame rate, bitrate, qp
 *      and preset
 *   3. verbosity, threads, GOP/refresh, AUD, QPA, tier and level
 *   4. frame rate, picture format, colour description
 *   5. user "vvenc-params", then rate control / pass settings
 *   6. create and open the encoder, optionally initialise the pass
 *   7. allocate the access unit and produce extradata if requested
 *
 * Error paths return without releasing what was created so far; the codec
 * sets FF_CODEC_CAP_INIT_CLEANUP, so cleanup is left to vvenc_close().
 *
 * @param avctx codec context
 * @return 0 on success, a negative AVERROR code otherwise
 */
static av_cold int vvenc_init(AVCodecContext *avctx)
{
    int ret;
    int framerate;
    VVenCContext *s = avctx->priv_data;
    vvenc_config params;
    vvencPresetMode preset = (vvencPresetMode) s->preset;

    if (avctx->flags & AV_CODEC_FLAG_INTERLACED_DCT) {
        av_log(avctx, AV_LOG_ERROR, "interlaced not supported\n");
        return AVERROR(EINVAL);
    }

    vvenc_config_default(&params);

    /* Integer frame rate for vvenc_init_default() only; the exact fraction
     * is written later by vvenc_set_framerate(). */
    if (avctx->framerate.num > 0 && avctx->framerate.den > 0)
        framerate = avctx->framerate.num / avctx->framerate.den;
    else
        framerate = avctx->time_base.den / avctx->time_base.num;

    vvenc_init_default(&params, avctx->width, avctx->height, framerate,
                       avctx->bit_rate, s->qp, preset);

    vvenc_set_verbository(&params);

    if (avctx->thread_count > 0)
        params.m_numThreads = avctx->thread_count;

    /* GOP settings (IDR/CRA) */
    if (avctx->flags & AV_CODEC_FLAG_CLOSED_GOP)
        params.m_DecodingRefreshType = VVENC_DRT_IDR;

    if (avctx->gop_size == 1) {
        /* intra-only */
        params.m_GOPSize     = 1;
        params.m_IntraPeriod = 1;
    } else
        params.m_IntraPeriodSec = s->intra_refresh_sec;

    params.m_AccessUnitDelimiter = true;
    params.m_usePerceptQPA       = s->qpa;
    params.m_levelTier           = (vvencTier) s->tier;

    if (avctx->level > 0)
        params.m_level = (vvencLevel)avctx->level;

    /* The private "level" string option is applied after avctx->level and
     * therefore overrides it. */
    if (s->level) {
        if (VVENC_PARAM_BAD_VALUE == vvenc_set_param(&params, "level", s->level)) {
            av_log(avctx, AV_LOG_ERROR, "Invalid level_idc: %s.\n", s->level);
            return AVERROR(EINVAL);
        }
    }

    vvenc_set_framerate(avctx, &params);

    vvenc_set_pic_format(avctx, &params);

    vvenc_set_color_format(avctx, &params);

    ret = vvenc_parse_vvenc_params(avctx, &params);
    if (ret != 0)
        return ret;

    ret = vvenc_set_rc_mode(avctx, &params);
    if (ret != 0)
        return ret;

    s->encoder = vvenc_encoder_create();
    if (!s->encoder) {
        av_log(avctx, AV_LOG_ERROR, "cannot create libvvenc encoder\n");
        return AVERROR(ENOMEM);
    }

    /* The encoder handle is registered as callback context; it is what
     * vvenc_log_callback() receives as ctx. */
    vvenc_set_msg_callback(&params, s->encoder, vvenc_log_callback);
    ret = vvenc_encoder_open(s->encoder, &params);
    if (ret != 0) {
        av_log(avctx, AV_LOG_ERROR, "cannot open libvvenc encoder: %s\n",
               vvenc_get_last_error(s->encoder));
        return AVERROR_EXTERNAL;
    }

    vvenc_get_config(s->encoder, &params);     /* get the adapted config */

    av_log(avctx, AV_LOG_INFO, "libvvenc version: %s\n", vvenc_get_version());
    if (av_log_get_level() >= AV_LOG_VERBOSE)
        av_log(avctx, AV_LOG_INFO, "%s\n", vvenc_get_config_as_string(&params, params.m_verbosity));

    if (params.m_RCNumPasses == 2) {
        /* m_RCPass is 1-based here, vvenc_init_pass() is given pass - 1. */
        ret = vvenc_init_pass(s->encoder, params.m_RCPass - 1, s->stats);
        if (ret != 0) {
            av_log(avctx, AV_LOG_ERROR, "cannot init pass %d: %s\n", params.m_RCPass,
                   vvenc_get_last_error(s->encoder));
            return AVERROR_EXTERNAL;
        }
    }

    s->au = vvenc_accessUnit_alloc();
    if (!s->au) {
        av_log(avctx, AV_LOG_FATAL, "cannot allocate memory for AU payload\n");
        return AVERROR(ENOMEM);
    }
    /* Payload buffer sized to width * height bytes. */
    vvenc_accessUnit_alloc_payload(s->au, avctx->width * avctx->height);
    if (!s->au->payload) {
        av_log(avctx, AV_LOG_FATAL, "cannot allocate payload memory of size %d\n",
               avctx->width * avctx->height);
        return AVERROR(ENOMEM);
    }

    ret = vvenc_init_extradata(avctx, s);
    if (ret != 0)
        return ret;

    s->encode_done = false;
    return 0;
}
|
|
|
/**
 * Encoder close callback: release the access unit and close the encoder.
 *
 * Both members are checked before use, so this is safe to call on a
 * partially initialised context.
 *
 * @param avctx codec context
 * @return 0 on success, AVERROR_EXTERNAL if libvvenc fails to close the encoder
 */
static av_cold int vvenc_close(AVCodecContext *avctx)
{
    VVenCContext *s = avctx->priv_data;

    if (s->au) {
        /* second argument true: also release the payload buffer
         * (NOTE(review): confirm against the vvenc API documentation) */
        vvenc_accessUnit_free(s->au, true);
        s->au = NULL;
    }

    if (s->encoder) {
        vvenc_print_summary(s->encoder);

        if (0 != vvenc_encoder_close(s->encoder))
            return AVERROR_EXTERNAL;
    }

    return 0;
}
|
|
|
/**
 * Encode callback: hand one frame (or NULL to flush) to libvvenc and return
 * the access unit it produced, if any.
 *
 * This function runs for every frame, so it is deliberately not marked
 * av_cold.
 *
 * @param avctx      codec context
 * @param pkt        packet receiving the encoded access unit
 * @param frame      input frame, or NULL when draining the encoder
 * @param got_packet set to 1 when pkt was filled; left untouched otherwise
 * @return 0 on success (with or without output),
 *         AVERROR_EXTERNAL if vvenc_encode() fails,
 *         or the error returned by ff_get_encode_buffer()
 */
static int vvenc_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame,
                       int *got_packet)
{
    VVenCContext *s = avctx->priv_data;
    vvencYUVBuffer *pyuvbuf = NULL;
    vvencYUVBuffer yuvbuf;
    int ret;

    if (frame) {
        /* Wrap the frame planes without copying. */
        vvenc_YUVBuffer_default(&yuvbuf);
        yuvbuf.planes[0].ptr = (int16_t *) frame->data[0];
        yuvbuf.planes[1].ptr = (int16_t *) frame->data[1];
        yuvbuf.planes[2].ptr = (int16_t *) frame->data[2];

        yuvbuf.planes[0].width  = frame->width;
        yuvbuf.planes[0].height = frame->height;
        yuvbuf.planes[0].stride = frame->linesize[0] >> 1; /* stride is used in 16bit samples in vvenc */

        /* Chroma planes: half width and half height (4:2:0). */
        yuvbuf.planes[1].width  = frame->width >> 1;
        yuvbuf.planes[1].height = frame->height >> 1;
        yuvbuf.planes[1].stride = frame->linesize[1] >> 1;

        yuvbuf.planes[2].width  = frame->width >> 1;
        yuvbuf.planes[2].height = frame->height >> 1;
        yuvbuf.planes[2].stride = frame->linesize[2] >> 1;

        yuvbuf.cts      = frame->pts;
        yuvbuf.ctsValid = true;
        pyuvbuf         = &yuvbuf;
    }

    /* Once the encoder reported completion there is nothing left to fetch. */
    if (s->encode_done)
        return 0;

    if (vvenc_encode(s->encoder, pyuvbuf, s->au, &s->encode_done) != 0)
        return AVERROR_EXTERNAL;

    /* No output for this call (the encoder may still be buffering input). */
    if (s->au->payloadUsedSize <= 0)
        return 0;

    ret = ff_get_encode_buffer(avctx, pkt, s->au->payloadUsedSize, 0);
    if (ret < 0)
        return ret;

    memcpy(pkt->data, s->au->payload, s->au->payloadUsedSize);

    if (s->au->ctsValid)
        pkt->pts = s->au->cts;
    if (s->au->dtsValid)
        pkt->dts = s->au->dts;
    /* rap is used as a 0/1 multiplier: the key flag is set only for
     * random access points. */
    pkt->flags |= AV_PKT_FLAG_KEY * s->au->rap;

    *got_packet = 1;
    return 0;
}
|
|
|
static const enum AVPixelFormat pix_fmts_vvenc[] = { |
|
AV_PIX_FMT_YUV420P10, |
|
AV_PIX_FMT_NONE |
|
}; |
|
|
|
#define OFFSET(x) offsetof(VVenCContext, x) |
|
#define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM |
|
static const AVOption options[] = { |
|
{ "preset", "set encoding preset", OFFSET(preset), AV_OPT_TYPE_INT, {.i64 = 2}, 0, 4, VE, "preset"}, |
|
{ "faster", "0", 0, AV_OPT_TYPE_CONST, {.i64 = VVENC_FASTER}, INT_MIN, INT_MAX, VE, "preset" }, |
|
{ "fast", "1", 0, AV_OPT_TYPE_CONST, {.i64 = VVENC_FAST}, INT_MIN, INT_MAX, VE, "preset" }, |
|
{ "medium", "2", 0, AV_OPT_TYPE_CONST, {.i64 = VVENC_MEDIUM}, INT_MIN, INT_MAX, VE, "preset" }, |
|
{ "slow", "3", 0, AV_OPT_TYPE_CONST, {.i64 = VVENC_SLOW}, INT_MIN, INT_MAX, VE, "preset" }, |
|
{ "slower", "4", 0, AV_OPT_TYPE_CONST, {.i64 = VVENC_SLOWER}, INT_MIN, INT_MAX, VE, "preset" }, |
|
{ "qp", "set quantization", OFFSET(qp), AV_OPT_TYPE_INT, {.i64 = 32}, -1, 63, VE }, |
|
{ "qpa", "set subjective (perceptually motivated) optimization", OFFSET(qpa), AV_OPT_TYPE_BOOL, {.i64 = 1}, 0, 1, VE}, |
|
{ "passlogfile", "Filename for 2 pass stats", OFFSET(stats), AV_OPT_TYPE_STRING, {.str = NULL}, 0, 0, VE}, |
|
{ "stats", "Filename for 2 pass stats", OFFSET(stats), AV_OPT_TYPE_STRING, {.str = NULL}, 0, 0, VE}, |
|
{ "period", "set (intra) refresh period in seconds", OFFSET(intra_refresh_sec), AV_OPT_TYPE_INT, {.i64 = 1}, 1, INT_MAX, VE }, |
|
{ "vvenc-params", "set the vvenc configuration using a :-separated list of key=value parameters", OFFSET(vvenc_opts), AV_OPT_TYPE_DICT, { 0 }, 0, 0, VE }, |
|
{ "level", "Specify level (as defined by Annex A)", OFFSET(level), AV_OPT_TYPE_STRING, {.str = NULL}, 0, 0, VE}, |
|
{ "tier", "set vvc tier", OFFSET(tier), AV_OPT_TYPE_INT, {.i64 = 0}, 0, 1, VE, "tier"}, |
|
{ "main", "main", 0, AV_OPT_TYPE_CONST, {.i64 = 0}, INT_MIN, INT_MAX, VE, "tier"}, |
|
{ "high", "high", 0, AV_OPT_TYPE_CONST, {.i64 = 1}, INT_MIN, INT_MAX, VE, "tier"}, |
|
{NULL} |
|
}; |
|
|
|
static const AVClass class = { |
|
.class_name = "libvvenc", |
|
.item_name = av_default_item_name, |
|
.option = options, |
|
.version = LIBAVUTIL_VERSION_INT, |
|
}; |
|
|
|
static const FFCodecDefault vvenc_defaults[] = { |
|
{ "b", "0" }, |
|
{ "g", "-1" }, |
|
{ NULL }, |
|
}; |
|
|
|
const FFCodec ff_libvvenc_encoder = { |
|
.p.name = "libvvenc", |
|
CODEC_LONG_NAME("libvvenc H.266 / VVC"), |
|
.p.type = AVMEDIA_TYPE_VIDEO, |
|
.p.id = AV_CODEC_ID_VVC, |
|
.p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY | |
|
AV_CODEC_CAP_OTHER_THREADS, |
|
.p.profiles = NULL_IF_CONFIG_SMALL(ff_vvc_profiles), |
|
.p.priv_class = &class, |
|
.p.wrapper_name = "libvvenc", |
|
.priv_data_size = sizeof(VVenCContext), |
|
.p.pix_fmts = pix_fmts_vvenc, |
|
.init = vvenc_init, |
|
FF_CODEC_ENCODE_CB(vvenc_frame), |
|
.close = vvenc_close, |
|
.defaults = vvenc_defaults, |
|
.caps_internal = FF_CODEC_CAP_INIT_CLEANUP | FF_CODEC_CAP_AUTO_THREADS |
|
};
|
|
|