FFmpeg/libavcodec/vulkan_decode.h

/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#ifndef AVCODEC_VULKAN_DECODE_H
#define AVCODEC_VULKAN_DECODE_H

#include "codec_id.h"
#include "decode.h"
#include "hwaccel_internal.h"
#include "internal.h"

#include "vulkan_video.h"

/**
 * Per-codec description of a Vulkan video decoder: the codec ID together
 * with the Vulkan extension, queue flags, codec operation and extension
 * properties associated with decoding it.
 */
typedef struct FFVulkanDecodeDescriptor {
    enum AVCodecID                   codec_id;         /* Codec this descriptor applies to */
    FFVulkanExtensions               decode_extension; /* Decode extension flag for this codec */
    VkQueueFlagBits                  queue_flags;      /* Specifies the queue used for decoding */
    VkVideoCodecOperationFlagBitsKHR decode_op;        /* Vulkan video codec operation for this codec */

    /* NOTE(review): presumably the name/version of the codec's Vulkan video
     * std header extension - confirm against the tables in vulkan_decode.c */
    VkExtensionProperties ext_props;
} FFVulkanDecodeDescriptor;

/**
 * Storage for the Vulkan video profile structures of a decode session:
 * one codec-specific profile struct per supported codec, plus the generic
 * usage, profile and profile-list structs.
 *
 * NOTE(review): presumably only the codec-specific member matching the
 * stream's codec is filled in, and the structs are chained through pNext -
 * confirm in vulkan_decode.c.
 */
typedef struct FFVulkanDecodeProfileData {
    VkVideoDecodeH264ProfileInfoKHR h264_profile; /* H.264-specific profile info */
    VkVideoDecodeH265ProfileInfoKHR h265_profile; /* H.265-specific profile info */
    VkVideoDecodeAV1ProfileInfoKHR av1_profile;   /* AV1-specific profile info */
    VkVideoDecodeUsageInfoKHR usage;              /* Decode usage hints */
    VkVideoProfileInfoKHR profile;                /* Generic video profile */
    VkVideoProfileListInfoKHR profile_list;       /* Profile list struct */
} FFVulkanDecodeProfileData;

/**
 * Decoder state referenced from FFVulkanDecodeContext through its
 * shared_ctx pointer.
 *
 * NOTE(review): presumably one instance is shared by all decoding threads
 * of a codec context - confirm the ownership rules in vulkan_decode.c.
 */
typedef struct FFVulkanDecodeShared {
    FFVulkanContext s;             /* Vulkan context */
    FFVkVideoCommon common;        /* Common Vulkan video state */
    AVVulkanDeviceQueueFamily *qf; /* Queue family; presumably the one used for decoding - confirm */
    FFVkExecPool exec_pool;        /* Execution pool */

    /* NOTE(review): presumably the pool backing the buffers returned by
     * ff_vk_get_decode_buffer() - confirm */
    AVBufferPool *buf_pool;

    VkVideoCapabilitiesKHR caps;           /* Video capabilities */
    VkVideoDecodeCapabilitiesKHR dec_caps; /* Decode-specific capabilities */

    /* NOTE(review): judging by the name, session parameters with no
     * contents; when they are used is not visible here - confirm */
    VkVideoSessionParametersKHR empty_session_params;
} FFVulkanDecodeShared;

/**
 * Vulkan decoder context: a pointer to the shared decoder state, the
 * current session parameters, hardware oddity/quirk flags, and the state
 * marked below as thread-local.
 */
typedef struct FFVulkanDecodeContext {
    FFVulkanDecodeShared *shared_ctx; /* Shared decoder state */
    AVBufferRef *session_params;      /* Session parameters wrapped in an AVBufferRef
                                       * (see ff_vk_decode_create_params()) */

    int dedicated_dpb; /* Oddity  #1 - separate DPB images */
    int external_fg;   /* Oddity  #2 - hardware can't apply film grain */
    uint32_t frame_id_alloc_mask; /* For AV1 only */

    /* Workaround for NVIDIA drivers tested with CTS version 1.3.8 for AV1.
     * The tests were incorrect as the OrderHints were offset by 1. */
    int quirk_av1_offset;

    /* Thread-local state below */
    /* HEVC header storage and its size.
     * NOTE(review): the unit of hevc_headers_size (presumably bytes) is not
     * visible in this header - confirm in vulkan_hevc.c */
    struct HEVCHeaderSet *hevc_headers;
    size_t hevc_headers_size;

    /* Slice offsets array.
     * NOTE(review): slice_off_max is presumably the allocated size of
     * slice_off - confirm in vulkan_decode.c */
    uint32_t                       *slice_off;
    unsigned int                    slice_off_max;
} FFVulkanDecodeContext;

/**
 * Per-picture Vulkan decoding state: image views, the resource and
 * reference-slot descriptions of the current picture and of its references,
 * the main decode info struct, the slice data buffer, and the Vulkan
 * function pointers needed to destroy the picture.
 */
typedef struct FFVulkanDecodePicture {
    AVFrame                        *dpb_frame;      /* Only used for out-of-place decoding. */

    VkImageView                     img_view_ref;   /* Image representation view (reference) */
    VkImageView                     img_view_out;   /* Image representation view (output-only) */
    VkImageView                     img_view_dest;  /* Set to img_view_out if no layered refs are used */
    VkImageAspectFlags              img_aspect;     /* Image plane mask bits */
    VkImageAspectFlags              img_aspect_ref; /* Only used for out-of-place decoding */

    /* NOTE(review): presumably the semaphore and the value waited on through
     * wait_semaphores before the picture is freed - confirm in vulkan_decode.c */
    VkSemaphore                     sem;
    uint64_t                        sem_value;

    /* Current picture */
    VkVideoPictureResourceInfoKHR   ref;
    VkVideoReferenceSlotInfoKHR     ref_slot;

    /* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */
    VkVideoPictureResourceInfoKHR   refs     [36];
    VkVideoReferenceSlotInfoKHR     ref_slots[36];

    /* Main decoding struct */
    VkVideoDecodeInfoKHR            decode_info;

    /* Slice data */
    /* NOTE(review): slices_size is presumably the number of bytes of slice
     * data currently stored in slices_buf - confirm in ff_vk_decode_add_slice() */
    AVBufferRef                    *slices_buf;
    size_t                          slices_size;

    /* Vulkan functions needed for destruction, as no other context is guaranteed to exist */
    PFN_vkWaitSemaphores            wait_semaphores;
    PFN_vkDestroyImageView          destroy_image_view;
} FFVulkanDecodePicture;

/**
 * Initialize decoder.
 *
 * @param avctx codec context of the decoder to initialize
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_decode_init(AVCodecContext *avctx);

/**
 * Synchronize the contexts between 2 threads.
 *
 * @param dst codec context to update
 * @param src codec context to take the state from (not modified)
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_update_thread_context(AVCodecContext *dst, const AVCodecContext *src);

/**
 * Initialize hw_frames_ctx with the parameters needed to decode the stream
 * using the parameters from avctx.
 *
 * NOTE: if avctx->internal->hwaccel_priv_data exists, will partially initialize
 * the context.
 *
 * @param avctx         codec context supplying the stream parameters
 * @param hw_frames_ctx reference to the hardware frames context to fill in
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx);

/**
 * Removes current session parameters to recreate them
 *
 * @param avctx codec context whose session parameters are removed
 * @param t     NOTE(review): meaning not visible in this header
 * @param b     NOTE(review): meaning not visible in this header
 * @param s     NOTE(review): meaning not visible in this header
 *
 * NOTE(review): t/b/s look like a (type, buffer, size) triple required by a
 * callback signature and may be unused - confirm in vulkan_decode.c.
 */
int ff_vk_params_invalidate(AVCodecContext *avctx, int t, const uint8_t *b, uint32_t s);

/**
 * Prepare a frame, creates the image view, and sets up the dpb fields.
 *
 * @param dec        decoder context
 * @param pic        frame to prepare
 * @param vkpic      per-picture Vulkan state to set up for pic
 * @param is_current NOTE(review): presumably nonzero when pic is the picture
 *                   being decoded rather than a reference - confirm
 * @param alloc_dpb  NOTE(review): presumably nonzero to request a separate
 *                   DPB image for this picture - confirm
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_decode_prepare_frame(FFVulkanDecodeContext *dec, AVFrame *pic,
                               FFVulkanDecodePicture *vkpic, int is_current,
                               int alloc_dpb);

/**
 * Add slice data to frame.
 *
 * @param avctx         codec context
 * @param vp            picture the slice data is added to
 * @param data          slice data to add
 * @param size          size of data in bytes
 * @param add_startcode NOTE(review): presumably nonzero to have a start code
 *                      placed before the slice data - confirm
 * @param nb_slices     NOTE(review): presumably the caller's slice counter,
 *                      updated by this call - confirm
 * @param offsets       NOTE(review): presumably set to point at the array of
 *                      slice offsets - confirm
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,
                           const uint8_t *data, size_t size, int add_startcode,
                           uint32_t *nb_slices, const uint32_t **offsets);

/**
 * Decode a frame.
 *
 * @param avctx codec context
 * @param pic   frame to decode into
 * @param vp    per-picture Vulkan state of pic
 * @param rpic  array of frames; NOTE(review): presumably the reference
 *              frames of pic - confirm
 * @param rvkp  array of per-picture Vulkan states; NOTE(review): presumably
 *              parallel to rpic - confirm
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_decode_frame(AVCodecContext *avctx,
                       AVFrame *pic,    FFVulkanDecodePicture *vp,
                       AVFrame *rpic[], FFVulkanDecodePicture *rvkp[]);

/**
 * Free a frame and its state.
 *
 * @param dev_ctx hardware device context
 * @param vp      per-picture Vulkan state to free
 */
void ff_vk_decode_free_frame(AVHWDeviceContext *dev_ctx, FFVulkanDecodePicture *vp);

/**
 * Get an FFVkBuffer suitable for decoding from.
 *
 * @param ctx          decoder context
 * @param buf          where the buffer reference is returned
 * @param create_pNext NOTE(review): presumably a pNext chain used when the
 *                     underlying buffer is created - confirm
 * @param size         requested size; NOTE(review): presumably in bytes and
 *                     a minimum - confirm
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_get_decode_buffer(FFVulkanDecodeContext *ctx, AVBufferRef **buf,
                            void *create_pNext, size_t size);

/**
 * Create VkVideoSessionParametersKHR wrapped in an AVBufferRef.
 *
 * @param par_ref               where the new buffer reference is returned
 * @param logctx                context used for logging
 * @param ctx                   shared decoder state
 * @param session_params_create creation info for the session parameters
 * @return status code; NOTE(review): presumably 0 on success and a negative
 *         AVERROR code on failure - confirm in vulkan_decode.c
 */
int ff_vk_decode_create_params(AVBufferRef **par_ref, void *logctx, FFVulkanDecodeShared *ctx,
                               const VkVideoSessionParametersCreateInfoKHR *session_params_create);

/**
 * Flush decoder.
 *
 * @param avctx codec context of the decoder to flush
 */
void ff_vk_decode_flush(AVCodecContext *avctx);

/**
 * Free decoder.
 *
 * @param avctx codec context of the decoder to free
 * @return status code; NOTE(review): presumably 0 on success - confirm in
 *         vulkan_decode.c
 */
int ff_vk_decode_uninit(AVCodecContext *avctx);

#endif /* AVCODEC_VULKAN_DECODE_H */
libavcodec: add Vulkan common video decoding code 2 years ago			`/*`
			`* This file is part of FFmpeg.`
			`*`
			`* FFmpeg is free software; you can redistribute it and/or`
			`* modify it under the terms of the GNU Lesser General Public`
			`* License as published by the Free Software Foundation; either`
			`* version 2.1 of the License, or (at your option) any later version.`
			`*`
			`* FFmpeg is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`* Lesser General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU Lesser General Public`
			`* License along with FFmpeg; if not, write to the Free Software`
			`* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA`
			`*/`

			`#ifndef AVCODEC_VULKAN_DECODE_H`
			`#define AVCODEC_VULKAN_DECODE_H`

avcodec/vulkan_decode: Un-sparse extensions table Only three of the 226 (== AV_CODEC_ID_AV1) entries have been used. Unsparsing this table is especially important given that this array lives in .data.rel.ro. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 11 months ago			`#include "codec_id.h"`
libavcodec: add Vulkan common video decoding code 2 years ago			`#include "decode.h"`
avcodec/hwconfig: Move HWACCEL_CAP_* to a new header libavcodec/hwconfig.h currently contains HWACCEL_CAP_* flags as well as the definition of AVCodecHWConfigInternal and some macros to create them. The users of these two are nearly disjoint: The flags are used by files providing AVHWAccels whereas AVCodecHWConfigInternal is used by files providing codecs (for FFCodec.hw_configs). This patch therefore moves these flags to a new file hwaccel_internal.h. Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 2 years ago			`#include "hwaccel_internal.h"`
libavcodec: add Vulkan common video decoding code 2 years ago			`#include "internal.h"`

			`#include "vulkan_video.h"`

avcodec/vulkan_video: Merge dec part of FFVkCodecMap and extension props All the fields of FFVkCodecMap are either decoder-only or encoder-only (with the latter being unused and unset for now). Yet there is already a per-decoder struct containing static information about these decoders, namely VkExtensionProperties. This commit merges the decoder-parts of FFVkCodecMap with the VkExtensionProperties into a common structure. Given that FFVkCodecMap is now unused, it is removed. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 11 months ago			`typedef struct FFVulkanDecodeDescriptor {`
avcodec/vulkan_decode: Un-sparse extensions table Only three of the 226 (== AV_CODEC_ID_AV1) entries have been used. Unsparsing this table is especially important given that this array lives in .data.rel.ro. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 11 months ago			`enum AVCodecID codec_id;`
avcodec/vulkan_video: Merge dec part of FFVkCodecMap and extension props All the fields of FFVkCodecMap are either decoder-only or encoder-only (with the latter being unused and unset for now). Yet there is already a per-decoder struct containing static information about these decoders, namely VkExtensionProperties. This commit merges the decoder-parts of FFVkCodecMap with the VkExtensionProperties into a common structure. Given that FFVkCodecMap is now unused, it is removed. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 11 months ago			`FFVulkanExtensions decode_extension;`
vulkan_decode: add queue_flags field to specify queue used 2 months ago			`VkQueueFlagBits queue_flags;`
avcodec/vulkan_video: Merge dec part of FFVkCodecMap and extension props All the fields of FFVkCodecMap are either decoder-only or encoder-only (with the latter being unused and unset for now). Yet there is already a per-decoder struct containing static information about these decoders, namely VkExtensionProperties. This commit merges the decoder-parts of FFVkCodecMap with the VkExtensionProperties into a common structure. Given that FFVkCodecMap is now unused, it is removed. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 11 months ago			`VkVideoCodecOperationFlagBitsKHR decode_op;`

			`VkExtensionProperties ext_props;`
			`} FFVulkanDecodeDescriptor;`

libavcodec: add Vulkan common video decoding code 2 years ago			`typedef struct FFVulkanDecodeProfileData {`
			`VkVideoDecodeH264ProfileInfoKHR h264_profile;`
avcodec/vulkan_decode: fix struct type for h265_profile Signed-off-by: Kacper Michajłow <kasper93@gmail.com> 1 year ago			`VkVideoDecodeH265ProfileInfoKHR h265_profile;`
vulkan_av1: port to the new stable API Co-Authored-by: Dave Airlie <airlied@redhat.com> 1 year ago			`VkVideoDecodeAV1ProfileInfoKHR av1_profile;`
libavcodec: add Vulkan common video decoding code 2 years ago			`VkVideoDecodeUsageInfoKHR usage;`
			`VkVideoProfileInfoKHR profile;`
			`VkVideoProfileListInfoKHR profile_list;`
			`} FFVulkanDecodeProfileData;`

			`typedef struct FFVulkanDecodeShared {`
			`FFVulkanContext s;`
			`FFVkVideoCommon common;`
vulkan: do not reinvent a queue context struct We recently introduced a public field which was a superset of the queue context we used to have. Switch to using it entirely. This also allows us to get rid of the NIH function which was valid only for video queues. 2 months ago			`AVVulkanDeviceQueueFamily *qf;`
vulkan_decode: use a single execution pool Originally, the decoder had a single execution pool, with one execution context per thread. Execution pools were always intended to be thread-safe, as long as there were enough execution contexts in the pool to satisfy all threads. Due to synchronization issues, the threading part was removed at some point, and, for decoding, each thread had its own execution pool. Having a single execution pool per context is hacky, not to mention wasteful. Most importantly, we cannot associate single shaders across multiple execution pools for a single application. This means that we cannot use shaders to either apply film grain, or use this framework for software-defined decoders. The recent commits added threading capabilities back to the execution pool, and the number of contexts in each pool was increased. This was done with the assumption that the execution pool was singular, which it was not. This led to increased parallelism and number of frames in flight, which is taxing on memory. This commit finally restores proper threading behaviour. The validation layer has issues that are reported and addressed in the earlier commit. 2 months ago			`FFVkExecPool exec_pool;`
vulkan_decode: use the hwfc->user_opaque field to store the profile 2 years ago
vulkan_video: remove NIH pooled buffer implementation The code predates ff_vk_get_pooled_buffer(). 7 months ago			`AVBufferPool *buf_pool;`

vulkan_decode: use the hwfc->user_opaque field to store the profile 2 years ago			`VkVideoCapabilitiesKHR caps;`
			`VkVideoDecodeCapabilitiesKHR dec_caps;`
libavcodec: add Vulkan common video decoding code 2 years ago
			`VkVideoSessionParametersKHR empty_session_params;`
			`} FFVulkanDecodeShared;`

			`typedef struct FFVulkanDecodeContext {`
avcodec/vulkan_decode: Use RefStruct API for shared_ref Avoids allocations, error checks and indirections. Also increases type-safety. Reviewed-by: Lynne <dev@lynne.ee> Tested-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 1 year ago			`FFVulkanDecodeShared *shared_ctx;`
libavcodec: add Vulkan common video decoding code 2 years ago			`AVBufferRef *session_params;`

			`int dedicated_dpb; /* Oddity #1 - separate DPB images */`
av1dec: add Vulkan hwaccel 2 years ago			`int external_fg; /* Oddity #2 - hardware can't apply film grain */`
			`uint32_t frame_id_alloc_mask; /* For AV1 only */`
libavcodec: add Vulkan common video decoding code 2 years ago
vulkan_av1: add workaround for NVIDIA drivers tested on broken CTS The first release of the CTS for AV1 decoding had incorrect offsets for the OrderHints values. The CTS will be fixed, and eventually, the drivers will be updated to the proper spec-conforming behaviour, but we still need to add a workaround as this will take months. Only NVIDIA use these values at all, so limit the workaround to only NVIDIA. Also, other vendors don't tend to provide accurate CTS information. 10 months ago			`/* Workaround for NVIDIA drivers tested with CTS version 1.3.8 for AV1.`
			`* The tests were incorrect as the OrderHints were offset by 1. */`
			`int quirk_av1_offset;`

libavcodec: add Vulkan common video decoding code 2 years ago			`/* Thread-local state below */`
vulkan_hevc: switch from a buffer pool to a malloc and simplify Simpler and more robust now that contexts are not shared between threads. 1 year ago			`struct HEVCHeaderSet *hevc_headers;`
			`size_t hevc_headers_size;`
vulkan_decode: clean up slice handling Move the slice offsets buffer to the thread decode context. It isn't part of the resources for frame decoding, the driver has to process and finish with it at submission time. That way, it doesn't need to be alloc'd + freed on every frame. 2 years ago
			`uint32_t *slice_off;`
			`unsigned int slice_off_max;`
libavcodec: add Vulkan common video decoding code 2 years ago			`} FFVulkanDecodeContext;`

			`typedef struct FFVulkanDecodePicture {`
			`AVFrame *dpb_frame; /* Only used for out-of-place decoding. */`

			`VkImageView img_view_ref; /* Image representation view (reference) */`
			`VkImageView img_view_out; /* Image representation view (output-only) */`
			`VkImageView img_view_dest; /* Set to img_view_out if no layered refs are used */`
			`VkImageAspectFlags img_aspect; /* Image plane mask bits */`
			`VkImageAspectFlags img_aspect_ref; /* Only used for out-of-place decoding */`

			`VkSemaphore sem;`
			`uint64_t sem_value;`

			`/* Current picture */`
			`VkVideoPictureResourceInfoKHR ref;`
			`VkVideoReferenceSlotInfoKHR ref_slot;`

			`/* Picture refs. H264 has the maximum number of refs (36) of any supported codec. */`
			`VkVideoPictureResourceInfoKHR refs [36];`
			`VkVideoReferenceSlotInfoKHR ref_slots[36];`

			`/* Main decoding struct */`
			`VkVideoDecodeInfoKHR decode_info;`

			`/* Slice data */`
			`AVBufferRef *slices_buf;`
			`size_t slices_size;`
vulkan_decode: don't call get_proc_addr on every frame's destruction The issue is that we cannot rely on any context existing when we free frames. The Vulkan functions are loaded in each context separately, so until now, we've just been loading them on every frame's destruction. Rather than do this, just save the function pointers we need in each frame. The function pointers are guaranteed to not change and exist. 1 year ago
			`/* Vulkan functions needed for destruction, as no other context is guaranteed to exist */`
			`PFN_vkWaitSemaphores wait_semaphores;`
			`PFN_vkDestroyImageView destroy_image_view;`
libavcodec: add Vulkan common video decoding code 2 years ago			`} FFVulkanDecodePicture;`

			`/**`
			`* Initialize decoder.`
			`*/`
			`int ff_vk_decode_init(AVCodecContext *avctx);`

			`/**`
			`* Synchronize the contexts between 2 threads.`
			`*/`
			`int ff_vk_update_thread_context(AVCodecContext *dst, const AVCodecContext *src);`

			`/**`
			`* Initialize hw_frames_ctx with the parameters needed to decode the stream`
			`* using the parameters from avctx.`
			`*`
			`* NOTE: if avctx->internal->hwaccel_priv_data exists, will partially initialize`
			`* the context.`
			`*/`
			`int ff_vk_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx);`

			`/**`
vulkan_decode: simplify and make session parameter generation more robust This commit scraps a bool to signal to recreate the session parameters, but instead destroys them, forcing them to be recreated. As this can happen between start_frame and end_frame, do this at both places. 2 years ago			`* Removes current session parameters to recreate them`
libavcodec: add Vulkan common video decoding code 2 years ago			`*/`
vulkan_decode: simplify and make session parameter generation more robust This commit scraps a bool to signal to recreate the session parameters, but instead destroys them, forcing them to be recreated. As this can happen between start_frame and end_frame, do this at both places. 2 years ago			`int ff_vk_params_invalidate(AVCodecContext *avctx, int t, const uint8_t *b, uint32_t s);`
libavcodec: add Vulkan common video decoding code 2 years ago
			`/**`
			`* Prepare a frame, creates the image view, and sets up the dpb fields.`
			`*/`
			`int ff_vk_decode_prepare_frame(FFVulkanDecodeContext *dec, AVFrame *pic,`
			`FFVulkanDecodePicture *vkpic, int is_current,`
			`int alloc_dpb);`

			`/**`
			`* Add slice data to frame.`
			`*/`
			`int ff_vk_decode_add_slice(AVCodecContext *avctx, FFVulkanDecodePicture *vp,`
			`const uint8_t *data, size_t size, int add_startcode,`
			`uint32_t *nb_slices, const uint32_t **offsets);`

			`/**`
			`* Decode a frame.`
			`*/`
			`int ff_vk_decode_frame(AVCodecContext *avctx,`
			`AVFrame *pic, FFVulkanDecodePicture *vp,`
			`AVFrame *rpic[], FFVulkanDecodePicture *rvkp[]);`

			`/**`
			`* Free a frame and its state.`
			`*/`
			`void ff_vk_decode_free_frame(AVHWDeviceContext *dev_ctx, FFVulkanDecodePicture *vp);`

			`/**`
			`* Get an FFVkBuffer suitable for decoding from.`
			`*/`
			`int ff_vk_get_decode_buffer(FFVulkanDecodeContext *ctx, AVBufferRef **buf,`
			`void *create_pNext, size_t size);`

			`/**`
avcodec/vulkan_decode: Factor creating session params out, fix leak All Vulkan HWAccels share the same boilerplate code for creating session params and this includes a common bug: In case actually creating the video session parameters fails, the buffer destined to hold them leaks; in case of HEVC this is also true if get_data_set_buf() fails. This commit factors this code out and fixes the leak. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 1 year ago			`* Create VkVideoSessionParametersKHR wrapped in an AVBufferRef.`
libavcodec: add Vulkan common video decoding code 2 years ago			`*/`
avcodec/vulkan_decode: Factor creating session params out, fix leak All Vulkan HWAccels share the same boilerplate code for creating session params and this includes a common bug: In case actually creating the video session parameters fails, the buffer destined to hold them leaks; in case of HEVC this is also true if get_data_set_buf() fails. This commit factors this code out and fixes the leak. Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com> 1 year ago			`int ff_vk_decode_create_params(AVBufferRef **par_ref, void *logctx, FFVulkanDecodeShared *ctx,`
			`const VkVideoSessionParametersCreateInfoKHR *session_params_create);`
libavcodec: add Vulkan common video decoding code 2 years ago
			`/**`
			`* Flush decoder.`
			`*/`
			`void ff_vk_decode_flush(AVCodecContext *avctx);`

			`/**`
			`* Free decoder.`
			`*/`
			`int ff_vk_decode_uninit(AVCodecContext *avctx);`

			`#endif /* AVCODEC_VULKAN_DECODE_H */`