mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
544 lines
18 KiB
544 lines
18 KiB
/* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or |
|
* modify it under the terms of the GNU Lesser General Public |
|
* License as published by the Free Software Foundation; either |
|
* version 2.1 of the License, or (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
* Lesser General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU Lesser General Public |
|
* License along with FFmpeg; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
*/ |
|
|
|
#ifndef AVCODEC_VAAPI_ENCODE_H |
|
#define AVCODEC_VAAPI_ENCODE_H |
|
|
|
#include <stdint.h> |
|
|
|
#include <va/va.h> |
|
|
|
#if VA_CHECK_VERSION(1, 0, 0) |
|
#include <va/va_str.h> |
|
#endif |
|
|
|
#include "libavutil/hwcontext.h" |
|
#include "libavutil/hwcontext_vaapi.h" |
|
#include "libavutil/fifo.h" |
|
|
|
#include "avcodec.h" |
|
#include "hwconfig.h" |
|
|
|
struct VAAPIEncodeType; |
|
struct VAAPIEncodePicture; |
|
|
|
enum { |
|
MAX_CONFIG_ATTRIBUTES = 4, |
|
MAX_GLOBAL_PARAMS = 4, |
|
MAX_DPB_SIZE = 16, |
|
MAX_PICTURE_REFERENCES = 2, |
|
MAX_REORDER_DELAY = 16, |
|
MAX_PARAM_BUFFER_SIZE = 1024, |
|
// A.4.1: table A.6 allows at most 22 tile rows for any level. |
|
MAX_TILE_ROWS = 22, |
|
// A.4.1: table A.6 allows at most 20 tile columns for any level. |
|
MAX_TILE_COLS = 20, |
|
MAX_ASYNC_DEPTH = 64, |
|
MAX_REFERENCE_LIST_NUM = 2, |
|
}; |
|
|
|
extern const AVCodecHWConfigInternal *const ff_vaapi_encode_hw_configs[]; |
|
|
|
enum { |
|
PICTURE_TYPE_IDR = 0, |
|
PICTURE_TYPE_I = 1, |
|
PICTURE_TYPE_P = 2, |
|
PICTURE_TYPE_B = 3, |
|
}; |
|
|
|
typedef struct VAAPIEncodeSlice { |
|
int index; |
|
int row_start; |
|
int row_size; |
|
int block_start; |
|
int block_size; |
|
void *codec_slice_params; |
|
} VAAPIEncodeSlice; |
|
|
|
typedef struct VAAPIEncodePicture { |
|
struct VAAPIEncodePicture *next; |
|
|
|
int64_t display_order; |
|
int64_t encode_order; |
|
int64_t pts; |
|
int64_t duration; |
|
int force_idr; |
|
|
|
void *opaque; |
|
AVBufferRef *opaque_ref; |
|
|
|
#if VA_CHECK_VERSION(1, 0, 0) |
|
// ROI regions. |
|
VAEncROI *roi; |
|
#else |
|
void *roi; |
|
#endif |
|
|
|
int type; |
|
int b_depth; |
|
int encode_issued; |
|
int encode_complete; |
|
|
|
AVFrame *input_image; |
|
VASurfaceID input_surface; |
|
|
|
AVFrame *recon_image; |
|
VASurfaceID recon_surface; |
|
|
|
int nb_param_buffers; |
|
VABufferID *param_buffers; |
|
|
|
/* Refcounted via the refstruct-API */ |
|
VABufferID *output_buffer_ref; |
|
VABufferID output_buffer; |
|
|
|
void *priv_data; |
|
void *codec_picture_params; |
|
|
|
// Whether this picture is a reference picture. |
|
int is_reference; |
|
|
|
// The contents of the DPB after this picture has been decoded. |
|
// This will contain the picture itself if it is a reference picture, |
|
// but not if it isn't. |
|
int nb_dpb_pics; |
|
struct VAAPIEncodePicture *dpb[MAX_DPB_SIZE]; |
|
// The reference pictures used in decoding this picture. If they are |
|
// used by later pictures they will also appear in the DPB. ref[0][] for |
|
// previous reference frames. ref[1][] for future reference frames. |
|
int nb_refs[MAX_REFERENCE_LIST_NUM]; |
|
struct VAAPIEncodePicture *refs[MAX_REFERENCE_LIST_NUM][MAX_PICTURE_REFERENCES]; |
|
// The previous reference picture in encode order. Must be in at least |
|
// one of the reference list and DPB list. |
|
struct VAAPIEncodePicture *prev; |
|
// Reference count for other pictures referring to this one through |
|
// the above pointers, directly from incomplete pictures and indirectly |
|
// through completed pictures. |
|
int ref_count[2]; |
|
int ref_removed[2]; |
|
|
|
int nb_slices; |
|
VAAPIEncodeSlice *slices; |
|
|
|
/** |
|
* indicate if current frame is an independent frame that the coded data |
|
* can be pushed to downstream directly. Coded of non-independent frame |
|
* data will be concatenated into next independent frame. |
|
*/ |
|
int non_independent_frame; |
|
/** Tail data of current pic, used only for repeat header of AV1. */ |
|
char tail_data[MAX_PARAM_BUFFER_SIZE]; |
|
/** Byte length of tail_data. */ |
|
size_t tail_size; |
|
} VAAPIEncodePicture; |
|
|
|
typedef struct VAAPIEncodeProfile { |
|
// lavc profile value (AV_PROFILE_*). |
|
int av_profile; |
|
// Supported bit depth. |
|
int depth; |
|
// Number of components. |
|
int nb_components; |
|
// Chroma subsampling in width dimension. |
|
int log2_chroma_w; |
|
// Chroma subsampling in height dimension. |
|
int log2_chroma_h; |
|
// VAAPI profile value. |
|
VAProfile va_profile; |
|
} VAAPIEncodeProfile; |
|
|
|
enum { |
|
RC_MODE_AUTO, |
|
RC_MODE_CQP, |
|
RC_MODE_CBR, |
|
RC_MODE_VBR, |
|
RC_MODE_ICQ, |
|
RC_MODE_QVBR, |
|
RC_MODE_AVBR, |
|
RC_MODE_MAX = RC_MODE_AVBR, |
|
}; |
|
|
|
typedef struct VAAPIEncodeRCMode { |
|
// Mode from above enum (RC_MODE_*). |
|
int mode; |
|
// Name. |
|
const char *name; |
|
// Supported in the compile-time VAAPI version. |
|
int supported; |
|
// VA mode value (VA_RC_*). |
|
uint32_t va_mode; |
|
// Uses bitrate parameters. |
|
int bitrate; |
|
// Supports maxrate distinct from bitrate. |
|
int maxrate; |
|
// Uses quality value. |
|
int quality; |
|
// Supports HRD/VBV parameters. |
|
int hrd; |
|
} VAAPIEncodeRCMode; |
|
|
|
typedef struct VAAPIEncodeContext { |
|
const AVClass *class; |
|
|
|
// Codec-specific hooks. |
|
const struct VAAPIEncodeType *codec; |
|
|
|
// Global options. |
|
|
|
// Use low power encoding mode. |
|
int low_power; |
|
|
|
// Number of I frames between IDR frames. |
|
int idr_interval; |
|
|
|
// Desired B frame reference depth. |
|
int desired_b_depth; |
|
|
|
// Max Frame Size |
|
int max_frame_size; |
|
|
|
// Explicitly set RC mode (otherwise attempt to pick from |
|
// available modes). |
|
int explicit_rc_mode; |
|
|
|
// Explicitly-set QP, for use with the "qp" options. |
|
// (Forces CQP mode when set, overriding everything else.) |
|
int explicit_qp; |
|
|
|
// Desired packed headers. |
|
unsigned int desired_packed_headers; |
|
|
|
// The required size of surfaces. This is probably the input |
|
// size (AVCodecContext.width|height) aligned up to whatever |
|
// block size is required by the codec. |
|
int surface_width; |
|
int surface_height; |
|
|
|
// The block size for slice calculations. |
|
int slice_block_width; |
|
int slice_block_height; |
|
|
|
// Everything above this point must be set before calling |
|
// ff_vaapi_encode_init(). |
|
|
|
// Chosen encoding profile details. |
|
const VAAPIEncodeProfile *profile; |
|
|
|
// Chosen rate control mode details. |
|
const VAAPIEncodeRCMode *rc_mode; |
|
// RC quality level - meaning depends on codec and RC mode. |
|
// In CQP mode this sets the fixed quantiser value. |
|
int rc_quality; |
|
|
|
// Encoding profile (VAProfile*). |
|
VAProfile va_profile; |
|
// Encoding entrypoint (VAEntryoint*). |
|
VAEntrypoint va_entrypoint; |
|
// Rate control mode. |
|
unsigned int va_rc_mode; |
|
// Bitrate for codec-specific encoder parameters. |
|
unsigned int va_bit_rate; |
|
// Packed headers which will actually be sent. |
|
unsigned int va_packed_headers; |
|
|
|
// Configuration attributes to use when creating va_config. |
|
VAConfigAttrib config_attributes[MAX_CONFIG_ATTRIBUTES]; |
|
int nb_config_attributes; |
|
|
|
VAConfigID va_config; |
|
VAContextID va_context; |
|
|
|
AVBufferRef *device_ref; |
|
AVHWDeviceContext *device; |
|
AVVAAPIDeviceContext *hwctx; |
|
|
|
// The hardware frame context containing the input frames. |
|
AVBufferRef *input_frames_ref; |
|
AVHWFramesContext *input_frames; |
|
|
|
// The hardware frame context containing the reconstructed frames. |
|
AVBufferRef *recon_frames_ref; |
|
AVHWFramesContext *recon_frames; |
|
|
|
// Pool of (reusable) bitstream output buffers. |
|
struct FFRefStructPool *output_buffer_pool; |
|
|
|
// Global parameters which will be applied at the start of the |
|
// sequence (includes rate control parameters below). |
|
int global_params_type[MAX_GLOBAL_PARAMS]; |
|
const void *global_params [MAX_GLOBAL_PARAMS]; |
|
size_t global_params_size[MAX_GLOBAL_PARAMS]; |
|
int nb_global_params; |
|
|
|
// Rate control parameters. |
|
VAEncMiscParameterRateControl rc_params; |
|
VAEncMiscParameterHRD hrd_params; |
|
VAEncMiscParameterFrameRate fr_params; |
|
VAEncMiscParameterBufferMaxFrameSize mfs_params; |
|
#if VA_CHECK_VERSION(0, 36, 0) |
|
VAEncMiscParameterBufferQualityLevel quality_params; |
|
#endif |
|
|
|
// Per-sequence parameter structure (VAEncSequenceParameterBuffer*). |
|
void *codec_sequence_params; |
|
|
|
// Per-sequence parameters found in the per-picture parameter |
|
// structure (VAEncPictureParameterBuffer*). |
|
void *codec_picture_params; |
|
|
|
// Current encoding window, in display (input) order. |
|
VAAPIEncodePicture *pic_start, *pic_end; |
|
// The next picture to use as the previous reference picture in |
|
// encoding order. Order from small to large in encoding order. |
|
VAAPIEncodePicture *next_prev[MAX_PICTURE_REFERENCES]; |
|
int nb_next_prev; |
|
|
|
// Next input order index (display order). |
|
int64_t input_order; |
|
// Number of frames that output is behind input. |
|
int64_t output_delay; |
|
// Next encode order index. |
|
int64_t encode_order; |
|
// Number of frames decode output will need to be delayed. |
|
int64_t decode_delay; |
|
// Next output order index (in encode order). |
|
int64_t output_order; |
|
|
|
// Timestamp handling. |
|
int64_t first_pts; |
|
int64_t dts_pts_diff; |
|
int64_t ts_ring[MAX_REORDER_DELAY * 3 + |
|
MAX_ASYNC_DEPTH]; |
|
|
|
// Slice structure. |
|
int slice_block_rows; |
|
int slice_block_cols; |
|
int nb_slices; |
|
int slice_size; |
|
|
|
// Tile encoding. |
|
int tile_cols; |
|
int tile_rows; |
|
// Tile width of the i-th column. |
|
int col_width[MAX_TILE_COLS]; |
|
// Tile height of i-th row. |
|
int row_height[MAX_TILE_ROWS]; |
|
// Location of the i-th tile column boundary. |
|
int col_bd[MAX_TILE_COLS + 1]; |
|
// Location of the i-th tile row boundary. |
|
int row_bd[MAX_TILE_ROWS + 1]; |
|
|
|
// Frame type decision. |
|
int gop_size; |
|
int closed_gop; |
|
int gop_per_idr; |
|
int p_per_i; |
|
int max_b_depth; |
|
int b_per_p; |
|
int force_idr; |
|
int idr_counter; |
|
int gop_counter; |
|
int end_of_stream; |
|
int p_to_gpb; |
|
|
|
// Whether the driver supports ROI at all. |
|
int roi_allowed; |
|
// Maximum number of regions supported by the driver. |
|
int roi_max_regions; |
|
// Quantisation range for offset calculations. Set by codec-specific |
|
// code, as it may change based on parameters. |
|
int roi_quant_range; |
|
|
|
// The encoder does not support cropping information, so warn about |
|
// it the first time we encounter any nonzero crop fields. |
|
int crop_warned; |
|
// If the driver does not support ROI then warn the first time we |
|
// encounter a frame with ROI side data. |
|
int roi_warned; |
|
|
|
AVFrame *frame; |
|
|
|
// Whether the driver support vaSyncBuffer |
|
int has_sync_buffer_func; |
|
// Store buffered pic |
|
AVFifo *encode_fifo; |
|
// Max number of frame buffered in encoder. |
|
int async_depth; |
|
|
|
/** Head data for current output pkt, used only for AV1. */ |
|
//void *header_data; |
|
//size_t header_data_size; |
|
|
|
/** |
|
* Buffered coded data of a pic if it is an non-independent frame. |
|
* This is a RefStruct reference. |
|
*/ |
|
VABufferID *coded_buffer_ref; |
|
|
|
/** Tail data of a pic, now only used for av1 repeat frame header. */ |
|
AVPacket *tail_pkt; |
|
} VAAPIEncodeContext; |
|
|
|
enum { |
|
// Codec supports controlling the subdivision of pictures into slices. |
|
FLAG_SLICE_CONTROL = 1 << 0, |
|
// Codec only supports constant quality (no rate control). |
|
FLAG_CONSTANT_QUALITY_ONLY = 1 << 1, |
|
// Codec is intra-only. |
|
FLAG_INTRA_ONLY = 1 << 2, |
|
// Codec supports B-pictures. |
|
FLAG_B_PICTURES = 1 << 3, |
|
// Codec supports referencing B-pictures. |
|
FLAG_B_PICTURE_REFERENCES = 1 << 4, |
|
// Codec supports non-IDR key pictures (that is, key pictures do |
|
// not necessarily empty the DPB). |
|
FLAG_NON_IDR_KEY_PICTURES = 1 << 5, |
|
// Codec output packet without timestamp delay, which means the |
|
// output packet has same PTS and DTS. |
|
FLAG_TIMESTAMP_NO_DELAY = 1 << 6, |
|
}; |
|
|
|
typedef struct VAAPIEncodeType { |
|
// List of supported profiles and corresponding VAAPI profiles. |
|
// (Must end with AV_PROFILE_UNKNOWN.) |
|
const VAAPIEncodeProfile *profiles; |
|
|
|
// Codec feature flags. |
|
int flags; |
|
|
|
// Default quality for this codec - used as quantiser or RC quality |
|
// factor depending on RC mode. |
|
int default_quality; |
|
|
|
// Determine encode parameters like block sizes for surface alignment |
|
// and slices. This may need to query the profile and entrypoint, |
|
// which will be available when this function is called. If not set, |
|
// assume that all blocks are 16x16 and that surfaces should be |
|
// aligned to match this. |
|
int (*get_encoder_caps)(AVCodecContext *avctx); |
|
|
|
// Perform any extra codec-specific configuration after the |
|
// codec context is initialised (set up the private data and |
|
// add any necessary global parameters). |
|
int (*configure)(AVCodecContext *avctx); |
|
|
|
// The size of any private data structure associated with each |
|
// picture (can be zero if not required). |
|
size_t picture_priv_data_size; |
|
|
|
// The size of the parameter structures: |
|
// sizeof(VAEnc{type}ParameterBuffer{codec}). |
|
size_t sequence_params_size; |
|
size_t picture_params_size; |
|
size_t slice_params_size; |
|
|
|
// Fill the parameter structures. |
|
int (*init_sequence_params)(AVCodecContext *avctx); |
|
int (*init_picture_params)(AVCodecContext *avctx, |
|
VAAPIEncodePicture *pic); |
|
int (*init_slice_params)(AVCodecContext *avctx, |
|
VAAPIEncodePicture *pic, |
|
VAAPIEncodeSlice *slice); |
|
|
|
// The type used by the packed header: this should look like |
|
// VAEncPackedHeader{something}. |
|
int sequence_header_type; |
|
int picture_header_type; |
|
int slice_header_type; |
|
|
|
// Write the packed header data to the provided buffer. |
|
// The sequence header is also used to fill the codec extradata |
|
// when the encoder is starting. |
|
int (*write_sequence_header)(AVCodecContext *avctx, |
|
char *data, size_t *data_len); |
|
int (*write_picture_header)(AVCodecContext *avctx, |
|
VAAPIEncodePicture *pic, |
|
char *data, size_t *data_len); |
|
int (*write_slice_header)(AVCodecContext *avctx, |
|
VAAPIEncodePicture *pic, |
|
VAAPIEncodeSlice *slice, |
|
char *data, size_t *data_len); |
|
|
|
// Fill an extra parameter structure, which will then be |
|
// passed to vaRenderPicture(). Will be called repeatedly |
|
// with increasing index argument until AVERROR_EOF is |
|
// returned. |
|
int (*write_extra_buffer)(AVCodecContext *avctx, |
|
VAAPIEncodePicture *pic, |
|
int index, int *type, |
|
char *data, size_t *data_len); |
|
|
|
// Write an extra packed header. Will be called repeatedly |
|
// with increasing index argument until AVERROR_EOF is |
|
// returned. |
|
int (*write_extra_header)(AVCodecContext *avctx, |
|
VAAPIEncodePicture *pic, |
|
int index, int *type, |
|
char *data, size_t *data_len); |
|
} VAAPIEncodeType; |
|
|
|
|
|
int ff_vaapi_encode_receive_packet(AVCodecContext *avctx, AVPacket *pkt); |
|
|
|
int ff_vaapi_encode_init(AVCodecContext *avctx); |
|
int ff_vaapi_encode_close(AVCodecContext *avctx); |
|
|
|
|
|
#define VAAPI_ENCODE_COMMON_OPTIONS \ |
|
{ "low_power", \ |
|
"Use low-power encoding mode (only available on some platforms; " \ |
|
"may not support all encoding features)", \ |
|
OFFSET(common.low_power), AV_OPT_TYPE_BOOL, \ |
|
{ .i64 = 0 }, 0, 1, FLAGS }, \ |
|
{ "idr_interval", \ |
|
"Distance (in I-frames) between IDR frames", \ |
|
OFFSET(common.idr_interval), AV_OPT_TYPE_INT, \ |
|
{ .i64 = 0 }, 0, INT_MAX, FLAGS }, \ |
|
{ "b_depth", \ |
|
"Maximum B-frame reference depth", \ |
|
OFFSET(common.desired_b_depth), AV_OPT_TYPE_INT, \ |
|
{ .i64 = 1 }, 1, INT_MAX, FLAGS }, \ |
|
{ "async_depth", "Maximum processing parallelism. " \ |
|
"Increase this to improve single channel performance. This option " \ |
|
"doesn't work if driver doesn't implement vaSyncBuffer function.", \ |
|
OFFSET(common.async_depth), AV_OPT_TYPE_INT, \ |
|
{ .i64 = 2 }, 1, MAX_ASYNC_DEPTH, FLAGS }, \ |
|
{ "max_frame_size", \ |
|
"Maximum frame size (in bytes)",\ |
|
OFFSET(common.max_frame_size), AV_OPT_TYPE_INT, \ |
|
{ .i64 = 0 }, 0, INT_MAX, FLAGS } |
|
|
|
#define VAAPI_ENCODE_RC_MODE(name, desc) \ |
|
{ #name, desc, 0, AV_OPT_TYPE_CONST, { .i64 = RC_MODE_ ## name }, \ |
|
0, 0, FLAGS, .unit = "rc_mode" } |
|
#define VAAPI_ENCODE_RC_OPTIONS \ |
|
{ "rc_mode",\ |
|
"Set rate control mode", \ |
|
OFFSET(common.explicit_rc_mode), AV_OPT_TYPE_INT, \ |
|
{ .i64 = RC_MODE_AUTO }, RC_MODE_AUTO, RC_MODE_MAX, FLAGS, .unit = "rc_mode" }, \ |
|
{ "auto", "Choose mode automatically based on other parameters", \ |
|
0, AV_OPT_TYPE_CONST, { .i64 = RC_MODE_AUTO }, 0, 0, FLAGS, .unit = "rc_mode" }, \ |
|
VAAPI_ENCODE_RC_MODE(CQP, "Constant-quality"), \ |
|
VAAPI_ENCODE_RC_MODE(CBR, "Constant-bitrate"), \ |
|
VAAPI_ENCODE_RC_MODE(VBR, "Variable-bitrate"), \ |
|
VAAPI_ENCODE_RC_MODE(ICQ, "Intelligent constant-quality"), \ |
|
VAAPI_ENCODE_RC_MODE(QVBR, "Quality-defined variable-bitrate"), \ |
|
VAAPI_ENCODE_RC_MODE(AVBR, "Average variable-bitrate") |
|
|
|
|
|
#endif /* AVCODEC_VAAPI_ENCODE_H */
|
|
|