mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
2954 lines
96 KiB
2954 lines
96 KiB
/* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or |
|
* modify it under the terms of the GNU Lesser General Public |
|
* License as published by the Free Software Foundation; either |
|
* version 2.1 of the License, or (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
* Lesser General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU Lesser General Public |
|
* License along with FFmpeg; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
*/ |
|
|
|
#define CL_USE_DEPRECATED_OPENCL_1_2_APIS |
|
|
|
#include <string.h> |
|
|
|
#include "config.h" |
|
|
|
#include "avassert.h" |
|
#include "avstring.h" |
|
#include "common.h" |
|
#include "hwcontext.h" |
|
#include "hwcontext_internal.h" |
|
#include "hwcontext_opencl.h" |
|
#include "mem.h" |
|
#include "pixdesc.h" |
|
|
|
#if HAVE_OPENCL_VAAPI_BEIGNET |
|
#include <unistd.h> |
|
#include <va/va.h> |
|
#include <va/va_drmcommon.h> |
|
#include <CL/cl_intel.h> |
|
#include "hwcontext_vaapi.h" |
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
#include <unistd.h> |
|
#include <CL/cl_intel.h> |
|
#include "hwcontext_drm.h" |
|
#endif |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
#if CONFIG_LIBMFX |
|
#include <mfx/mfxstructures.h> |
|
#endif |
|
#include <va/va.h> |
|
#include <CL/cl_va_api_media_sharing_intel.h> |
|
#include "hwcontext_vaapi.h" |
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 |
|
#define COBJMACROS |
|
#include <CL/cl_dx9_media_sharing.h> |
|
#include <dxva2api.h> |
|
#include "hwcontext_dxva2.h" |
|
#endif |
|
|
|
#if HAVE_OPENCL_D3D11 |
|
#include <CL/cl_d3d11.h> |
|
#include "hwcontext_d3d11va.h" |
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_ARM |
|
#include <CL/cl_ext.h> |
|
#include <drm_fourcc.h> |
|
#include "hwcontext_drm.h" |
|
#endif |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA && CONFIG_LIBMFX |
|
extern int ff_qsv_get_surface_base_handle(mfxFrameSurface1 *surf, |
|
enum AVHWDeviceType base_dev_typ, |
|
void **base_handle); |
|
#endif |
|
|
|
|
|
typedef struct OpenCLDeviceContext { |
|
// Default command queue to use for transfer/mapping operations on |
|
// the device. If the user supplies one, this is a reference to it. |
|
// Otherwise, it is newly-created. |
|
cl_command_queue command_queue; |
|
|
|
// The platform the context exists on. This is needed to query and |
|
// retrieve extension functions. |
|
cl_platform_id platform_id; |
|
|
|
// Platform/device-specific functions. |
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
int beignet_drm_mapping_usable; |
|
clCreateImageFromFdINTEL_fn clCreateImageFromFdINTEL; |
|
#endif |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
int qsv_mapping_usable; |
|
clCreateFromVA_APIMediaSurfaceINTEL_fn |
|
clCreateFromVA_APIMediaSurfaceINTEL; |
|
clEnqueueAcquireVA_APIMediaSurfacesINTEL_fn |
|
clEnqueueAcquireVA_APIMediaSurfacesINTEL; |
|
clEnqueueReleaseVA_APIMediaSurfacesINTEL_fn |
|
clEnqueueReleaseVA_APIMediaSurfacesINTEL; |
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 |
|
int dxva2_mapping_usable; |
|
cl_dx9_media_adapter_type_khr dx9_media_adapter_type; |
|
|
|
clCreateFromDX9MediaSurfaceKHR_fn |
|
clCreateFromDX9MediaSurfaceKHR; |
|
clEnqueueAcquireDX9MediaSurfacesKHR_fn |
|
clEnqueueAcquireDX9MediaSurfacesKHR; |
|
clEnqueueReleaseDX9MediaSurfacesKHR_fn |
|
clEnqueueReleaseDX9MediaSurfacesKHR; |
|
#endif |
|
|
|
#if HAVE_OPENCL_D3D11 |
|
int d3d11_mapping_usable; |
|
clCreateFromD3D11Texture2DKHR_fn |
|
clCreateFromD3D11Texture2DKHR; |
|
clEnqueueAcquireD3D11ObjectsKHR_fn |
|
clEnqueueAcquireD3D11ObjectsKHR; |
|
clEnqueueReleaseD3D11ObjectsKHR_fn |
|
clEnqueueReleaseD3D11ObjectsKHR; |
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_ARM |
|
int drm_arm_mapping_usable; |
|
#endif |
|
} OpenCLDeviceContext; |
|
|
|
typedef struct OpenCLFramesContext { |
|
// Command queue used for transfer/mapping operations on this frames |
|
// context. If the user supplies one, this is a reference to it. |
|
// Otherwise, it is a reference to the default command queue for the |
|
// device. |
|
cl_command_queue command_queue; |
|
|
|
#if HAVE_OPENCL_DXVA2 || HAVE_OPENCL_D3D11 |
|
// For mapping APIs which have separate creation and acquire/release |
|
// steps, this stores the OpenCL memory objects corresponding to each |
|
// frame. |
|
int nb_mapped_frames; |
|
AVOpenCLFrameDescriptor *mapped_frames; |
|
#endif |
|
} OpenCLFramesContext; |
|
|
|
|
|
static void CL_CALLBACK opencl_error_callback(const char *errinfo, |
|
const void *private_info, |
|
size_t cb, |
|
void *user_data) |
|
{ |
|
AVHWDeviceContext *ctx = user_data; |
|
av_log(ctx, AV_LOG_ERROR, "OpenCL error: %s\n", errinfo); |
|
} |
|
|
|
static void opencl_device_free(AVHWDeviceContext *hwdev) |
|
{ |
|
AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
|
cl_int cle; |
|
|
|
cle = clReleaseContext(hwctx->context); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to release OpenCL " |
|
"context: %d.\n", cle); |
|
} |
|
} |
|
|
|
static struct { |
|
const char *key; |
|
cl_platform_info name; |
|
} opencl_platform_params[] = { |
|
{ "platform_profile", CL_PLATFORM_PROFILE }, |
|
{ "platform_version", CL_PLATFORM_VERSION }, |
|
{ "platform_name", CL_PLATFORM_NAME }, |
|
{ "platform_vendor", CL_PLATFORM_VENDOR }, |
|
{ "platform_extensions", CL_PLATFORM_EXTENSIONS }, |
|
}; |
|
|
|
static struct { |
|
const char *key; |
|
cl_device_info name; |
|
} opencl_device_params[] = { |
|
{ "device_name", CL_DEVICE_NAME }, |
|
{ "device_vendor", CL_DEVICE_VENDOR }, |
|
{ "driver_version", CL_DRIVER_VERSION }, |
|
{ "device_version", CL_DEVICE_VERSION }, |
|
{ "device_profile", CL_DEVICE_PROFILE }, |
|
{ "device_extensions", CL_DEVICE_EXTENSIONS }, |
|
}; |
|
|
|
static struct { |
|
const char *key; |
|
cl_device_type type; |
|
} opencl_device_types[] = { |
|
{ "cpu", CL_DEVICE_TYPE_CPU }, |
|
{ "gpu", CL_DEVICE_TYPE_GPU }, |
|
{ "accelerator", CL_DEVICE_TYPE_ACCELERATOR }, |
|
{ "custom", CL_DEVICE_TYPE_CUSTOM }, |
|
{ "default", CL_DEVICE_TYPE_DEFAULT }, |
|
{ "all", CL_DEVICE_TYPE_ALL }, |
|
}; |
|
|
|
static char *opencl_get_platform_string(cl_platform_id platform_id, |
|
cl_platform_info key) |
|
{ |
|
char *str; |
|
size_t size; |
|
cl_int cle; |
|
cle = clGetPlatformInfo(platform_id, key, 0, NULL, &size); |
|
if (cle != CL_SUCCESS) |
|
return NULL; |
|
str = av_malloc(size); |
|
if (!str) |
|
return NULL; |
|
cle = clGetPlatformInfo(platform_id, key, size, str, &size); |
|
if (cle != CL_SUCCESS) { |
|
av_free(str); |
|
return NULL; |
|
} |
|
av_assert0(strlen(str) + 1 == size); |
|
return str; |
|
} |
|
|
|
static char *opencl_get_device_string(cl_device_id device_id, |
|
cl_device_info key) |
|
{ |
|
char *str; |
|
size_t size; |
|
cl_int cle; |
|
cle = clGetDeviceInfo(device_id, key, 0, NULL, &size); |
|
if (cle != CL_SUCCESS) |
|
return NULL; |
|
str = av_malloc(size); |
|
if (!str) |
|
return NULL; |
|
cle = clGetDeviceInfo(device_id, key, size, str, &size); |
|
if (cle != CL_SUCCESS) { |
|
av_free(str); |
|
return NULL; |
|
} |
|
av_assert0(strlen(str) + 1== size); |
|
return str; |
|
} |
|
|
|
static int opencl_check_platform_extension(cl_platform_id platform_id, |
|
const char *name) |
|
{ |
|
char *str; |
|
int found = 0; |
|
str = opencl_get_platform_string(platform_id, |
|
CL_PLATFORM_EXTENSIONS); |
|
if (str && strstr(str, name)) |
|
found = 1; |
|
av_free(str); |
|
return found; |
|
} |
|
|
|
static int opencl_check_device_extension(cl_device_id device_id, |
|
const char *name) |
|
{ |
|
char *str; |
|
int found = 0; |
|
str = opencl_get_device_string(device_id, |
|
CL_DEVICE_EXTENSIONS); |
|
if (str && strstr(str, name)) |
|
found = 1; |
|
av_free(str); |
|
return found; |
|
} |
|
|
|
static av_unused int opencl_check_extension(AVHWDeviceContext *hwdev, |
|
const char *name) |
|
{ |
|
AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
|
OpenCLDeviceContext *priv = hwdev->internal->priv; |
|
|
|
if (opencl_check_platform_extension(priv->platform_id, name)) { |
|
av_log(hwdev, AV_LOG_DEBUG, |
|
"%s found as platform extension.\n", name); |
|
return 1; |
|
} |
|
|
|
if (opencl_check_device_extension(hwctx->device_id, name)) { |
|
av_log(hwdev, AV_LOG_DEBUG, |
|
"%s found as device extension.\n", name); |
|
return 1; |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_enumerate_platforms(AVHWDeviceContext *hwdev, |
|
cl_uint *nb_platforms, |
|
cl_platform_id **platforms, |
|
void *context) |
|
{ |
|
cl_int cle; |
|
|
|
cle = clGetPlatformIDs(0, NULL, nb_platforms); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get number of " |
|
"OpenCL platforms: %d.\n", cle); |
|
return AVERROR(ENODEV); |
|
} |
|
av_log(hwdev, AV_LOG_DEBUG, "%u OpenCL platforms found.\n", |
|
*nb_platforms); |
|
|
|
*platforms = av_malloc_array(*nb_platforms, sizeof(**platforms)); |
|
if (!*platforms) |
|
return AVERROR(ENOMEM); |
|
|
|
cle = clGetPlatformIDs(*nb_platforms, *platforms, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get list of OpenCL " |
|
"platforms: %d.\n", cle); |
|
av_freep(platforms); |
|
return AVERROR(ENODEV); |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_filter_platform(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
void *context) |
|
{ |
|
AVDictionary *opts = context; |
|
const AVDictionaryEntry *param; |
|
char *str; |
|
int i, ret = 0; |
|
|
|
for (i = 0; i < FF_ARRAY_ELEMS(opencl_platform_params); i++) { |
|
param = av_dict_get(opts, opencl_platform_params[i].key, |
|
NULL, 0); |
|
if (!param) |
|
continue; |
|
|
|
str = opencl_get_platform_string(platform_id, |
|
opencl_platform_params[i].name); |
|
if (!str) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query %s " |
|
"of platform \"%s\".\n", |
|
opencl_platform_params[i].key, platform_name); |
|
return AVERROR_UNKNOWN; |
|
} |
|
if (!av_stristr(str, param->value)) { |
|
av_log(hwdev, AV_LOG_DEBUG, "%s does not match (\"%s\").\n", |
|
param->key, str); |
|
ret = 1; |
|
} |
|
av_free(str); |
|
} |
|
|
|
return ret; |
|
} |
|
|
|
static int opencl_enumerate_devices(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
cl_uint *nb_devices, |
|
cl_device_id **devices, |
|
void *context) |
|
{ |
|
cl_int cle; |
|
|
|
cle = clGetDeviceIDs(platform_id, CL_DEVICE_TYPE_ALL, |
|
0, NULL, nb_devices); |
|
if (cle == CL_DEVICE_NOT_FOUND) { |
|
av_log(hwdev, AV_LOG_DEBUG, "No devices found " |
|
"on platform \"%s\".\n", platform_name); |
|
*nb_devices = 0; |
|
return 0; |
|
} else if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
|
"on platform \"%s\": %d.\n", platform_name, cle); |
|
return AVERROR(ENODEV); |
|
} |
|
av_log(hwdev, AV_LOG_DEBUG, "%u OpenCL devices found on " |
|
"platform \"%s\".\n", *nb_devices, platform_name); |
|
|
|
*devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
|
if (!*devices) |
|
return AVERROR(ENOMEM); |
|
|
|
cle = clGetDeviceIDs(platform_id, CL_DEVICE_TYPE_ALL, |
|
*nb_devices, *devices, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get list of devices " |
|
"on platform \"%s\": %d.\n", platform_name, cle); |
|
av_freep(devices); |
|
return AVERROR(ENODEV); |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_filter_device(AVHWDeviceContext *hwdev, |
|
cl_device_id device_id, |
|
const char *device_name, |
|
void *context) |
|
{ |
|
AVDictionary *opts = context; |
|
const AVDictionaryEntry *param; |
|
char *str; |
|
int i, ret = 0; |
|
|
|
param = av_dict_get(opts, "device_type", NULL, 0); |
|
if (param) { |
|
cl_device_type match_type = 0, device_type; |
|
cl_int cle; |
|
|
|
for (i = 0; i < FF_ARRAY_ELEMS(opencl_device_types); i++) { |
|
if (!strcmp(opencl_device_types[i].key, param->value)) { |
|
match_type = opencl_device_types[i].type; |
|
break; |
|
} |
|
} |
|
if (!match_type) { |
|
av_log(hwdev, AV_LOG_ERROR, "Unknown device type %s.\n", |
|
param->value); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
cle = clGetDeviceInfo(device_id, CL_DEVICE_TYPE, |
|
sizeof(device_type), &device_type, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query device type " |
|
"of device \"%s\".\n", device_name); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
if (!(device_type & match_type)) { |
|
av_log(hwdev, AV_LOG_DEBUG, "device_type does not match.\n"); |
|
return 1; |
|
} |
|
} |
|
|
|
for (i = 0; i < FF_ARRAY_ELEMS(opencl_device_params); i++) { |
|
param = av_dict_get(opts, opencl_device_params[i].key, |
|
NULL, 0); |
|
if (!param) |
|
continue; |
|
|
|
str = opencl_get_device_string(device_id, |
|
opencl_device_params[i].name); |
|
if (!str) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query %s " |
|
"of device \"%s\".\n", |
|
opencl_device_params[i].key, device_name); |
|
return AVERROR_UNKNOWN; |
|
} |
|
if (!av_stristr(str, param->value)) { |
|
av_log(hwdev, AV_LOG_DEBUG, "%s does not match (\"%s\").\n", |
|
param->key, str); |
|
ret = 1; |
|
} |
|
av_free(str); |
|
} |
|
|
|
return ret; |
|
} |
|
|
|
typedef struct OpenCLDeviceSelector { |
|
int platform_index; |
|
int device_index; |
|
void *context; |
|
int (*enumerate_platforms)(AVHWDeviceContext *hwdev, |
|
cl_uint *nb_platforms, |
|
cl_platform_id **platforms, |
|
void *context); |
|
int (*filter_platform) (AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
void *context); |
|
int (*enumerate_devices) (AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
cl_uint *nb_devices, |
|
cl_device_id **devices, |
|
void *context); |
|
int (*filter_device) (AVHWDeviceContext *hwdev, |
|
cl_device_id device_id, |
|
const char *device_name, |
|
void *context); |
|
} OpenCLDeviceSelector; |
|
|
|
static int opencl_device_create_internal(AVHWDeviceContext *hwdev, |
|
const OpenCLDeviceSelector *selector, |
|
cl_context_properties *props) |
|
{ |
|
cl_uint nb_platforms; |
|
cl_platform_id *platforms = NULL; |
|
cl_platform_id platform_id; |
|
cl_uint nb_devices; |
|
cl_device_id *devices = NULL; |
|
AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
|
cl_int cle; |
|
cl_context_properties default_props[3]; |
|
char *platform_name_src = NULL, |
|
*device_name_src = NULL; |
|
int err, found, p, d; |
|
|
|
av_assert0(selector->enumerate_platforms && |
|
selector->enumerate_devices); |
|
|
|
err = selector->enumerate_platforms(hwdev, &nb_platforms, &platforms, |
|
selector->context); |
|
if (err) |
|
return err; |
|
|
|
found = 0; |
|
for (p = 0; p < nb_platforms; p++) { |
|
const char *platform_name; |
|
|
|
if (selector->platform_index >= 0 && |
|
selector->platform_index != p) |
|
continue; |
|
|
|
av_freep(&platform_name_src); |
|
platform_name_src = opencl_get_platform_string(platforms[p], |
|
CL_PLATFORM_NAME); |
|
if (platform_name_src) |
|
platform_name = platform_name_src; |
|
else |
|
platform_name = "Unknown Platform"; |
|
|
|
if (selector->filter_platform) { |
|
err = selector->filter_platform(hwdev, platforms[p], |
|
platform_name, |
|
selector->context); |
|
if (err < 0) |
|
goto fail; |
|
if (err > 0) |
|
continue; |
|
} |
|
|
|
err = selector->enumerate_devices(hwdev, platforms[p], platform_name, |
|
&nb_devices, &devices, |
|
selector->context); |
|
if (err < 0) |
|
continue; |
|
|
|
for (d = 0; d < nb_devices; d++) { |
|
const char *device_name; |
|
|
|
if (selector->device_index >= 0 && |
|
selector->device_index != d) |
|
continue; |
|
|
|
av_freep(&device_name_src); |
|
device_name_src = opencl_get_device_string(devices[d], |
|
CL_DEVICE_NAME); |
|
if (device_name_src) |
|
device_name = device_name_src; |
|
else |
|
device_name = "Unknown Device"; |
|
|
|
if (selector->filter_device) { |
|
err = selector->filter_device(hwdev, devices[d], |
|
device_name, |
|
selector->context); |
|
if (err < 0) |
|
goto fail; |
|
if (err > 0) |
|
continue; |
|
} |
|
|
|
av_log(hwdev, AV_LOG_VERBOSE, "%d.%d: %s / %s\n", p, d, |
|
platform_name, device_name); |
|
|
|
++found; |
|
platform_id = platforms[p]; |
|
hwctx->device_id = devices[d]; |
|
} |
|
|
|
av_freep(&devices); |
|
} |
|
|
|
if (found == 0) { |
|
av_log(hwdev, AV_LOG_ERROR, "No matching devices found.\n"); |
|
err = AVERROR(ENODEV); |
|
goto fail; |
|
} |
|
if (found > 1) { |
|
av_log(hwdev, AV_LOG_ERROR, "More than one matching device found.\n"); |
|
err = AVERROR(ENODEV); |
|
goto fail; |
|
} |
|
|
|
if (!props) { |
|
props = default_props; |
|
default_props[0] = CL_CONTEXT_PLATFORM; |
|
default_props[1] = (intptr_t)platform_id; |
|
default_props[2] = 0; |
|
} else { |
|
if (props[0] == CL_CONTEXT_PLATFORM && props[1] == 0) |
|
props[1] = (intptr_t)platform_id; |
|
} |
|
|
|
hwctx->context = clCreateContext(props, 1, &hwctx->device_id, |
|
&opencl_error_callback, hwdev, &cle); |
|
if (!hwctx->context) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to create OpenCL context: " |
|
"%d.\n", cle); |
|
err = AVERROR(ENODEV); |
|
goto fail; |
|
} |
|
|
|
hwdev->free = &opencl_device_free; |
|
|
|
err = 0; |
|
fail: |
|
av_freep(&platform_name_src); |
|
av_freep(&device_name_src); |
|
av_freep(&platforms); |
|
av_freep(&devices); |
|
return err; |
|
} |
|
|
|
static int opencl_device_create(AVHWDeviceContext *hwdev, const char *device, |
|
AVDictionary *opts, int flags) |
|
{ |
|
OpenCLDeviceSelector selector = { |
|
.context = opts, |
|
.enumerate_platforms = &opencl_enumerate_platforms, |
|
.filter_platform = &opencl_filter_platform, |
|
.enumerate_devices = &opencl_enumerate_devices, |
|
.filter_device = &opencl_filter_device, |
|
}; |
|
|
|
if (device && device[0]) { |
|
// Match one or both indices for platform and device. |
|
int d = -1, p = -1, ret; |
|
if (device[0] == '.') |
|
ret = sscanf(device, ".%d", &d); |
|
else |
|
ret = sscanf(device, "%d.%d", &p, &d); |
|
if (ret < 1) { |
|
av_log(hwdev, AV_LOG_ERROR, "Invalid OpenCL platform/device " |
|
"index specification \"%s\".\n", device); |
|
return AVERROR(EINVAL); |
|
} |
|
selector.platform_index = p; |
|
selector.device_index = d; |
|
} else { |
|
selector.platform_index = -1; |
|
selector.device_index = -1; |
|
} |
|
|
|
return opencl_device_create_internal(hwdev, &selector, NULL); |
|
} |
|
|
|
static int opencl_device_init(AVHWDeviceContext *hwdev) |
|
{ |
|
AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
|
OpenCLDeviceContext *priv = hwdev->internal->priv; |
|
cl_int cle; |
|
|
|
if (hwctx->command_queue) { |
|
cle = clRetainCommandQueue(hwctx->command_queue); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to retain external " |
|
"command queue: %d.\n", cle); |
|
return AVERROR(EIO); |
|
} |
|
priv->command_queue = hwctx->command_queue; |
|
} else { |
|
priv->command_queue = clCreateCommandQueue(hwctx->context, |
|
hwctx->device_id, |
|
0, &cle); |
|
if (!priv->command_queue) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to create internal " |
|
"command queue: %d.\n", cle); |
|
return AVERROR(EIO); |
|
} |
|
} |
|
|
|
cle = clGetDeviceInfo(hwctx->device_id, CL_DEVICE_PLATFORM, |
|
sizeof(priv->platform_id), &priv->platform_id, |
|
NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to determine the OpenCL " |
|
"platform containing the device.\n"); |
|
return AVERROR(EIO); |
|
} |
|
|
|
#define CL_FUNC(name, desc) do { \ |
|
if (fail) \ |
|
break; \ |
|
priv->name = clGetExtensionFunctionAddressForPlatform( \ |
|
priv->platform_id, #name); \ |
|
if (!priv->name) { \ |
|
av_log(hwdev, AV_LOG_VERBOSE, \ |
|
desc " function not found (%s).\n", #name); \ |
|
fail = 1; \ |
|
} else { \ |
|
av_log(hwdev, AV_LOG_VERBOSE, \ |
|
desc " function found (%s).\n", #name); \ |
|
} \ |
|
} while (0) |
|
|
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
{ |
|
int fail = 0; |
|
|
|
CL_FUNC(clCreateImageFromFdINTEL, |
|
"Beignet DRM to OpenCL image mapping"); |
|
|
|
if (fail) { |
|
av_log(hwdev, AV_LOG_WARNING, "Beignet DRM to OpenCL " |
|
"mapping not usable.\n"); |
|
priv->beignet_drm_mapping_usable = 0; |
|
} else { |
|
priv->beignet_drm_mapping_usable = 1; |
|
} |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
{ |
|
size_t props_size; |
|
cl_context_properties *props = NULL; |
|
VADisplay va_display; |
|
const char *va_ext = "cl_intel_va_api_media_sharing"; |
|
int i, fail = 0; |
|
|
|
if (!opencl_check_extension(hwdev, va_ext)) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
|
"required for QSV to OpenCL mapping.\n", va_ext); |
|
goto no_qsv; |
|
} |
|
|
|
cle = clGetContextInfo(hwctx->context, CL_CONTEXT_PROPERTIES, |
|
0, NULL, &props_size); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "Failed to get context " |
|
"properties: %d.\n", cle); |
|
goto no_qsv; |
|
} |
|
if (props_size == 0) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "Media sharing must be " |
|
"enabled on context creation to use QSV to " |
|
"OpenCL mapping.\n"); |
|
goto no_qsv; |
|
} |
|
|
|
props = av_malloc(props_size); |
|
if (!props) |
|
return AVERROR(ENOMEM); |
|
|
|
cle = clGetContextInfo(hwctx->context, CL_CONTEXT_PROPERTIES, |
|
props_size, props, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "Failed to get context " |
|
"properties: %d.\n", cle); |
|
goto no_qsv; |
|
} |
|
|
|
va_display = NULL; |
|
for (i = 0; i < (props_size / sizeof(*props) - 1); i++) { |
|
if (props[i] == CL_CONTEXT_VA_API_DISPLAY_INTEL) { |
|
va_display = (VADisplay)(intptr_t)props[i+1]; |
|
break; |
|
} |
|
} |
|
if (!va_display) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "Media sharing must be " |
|
"enabled on context creation to use QSV to " |
|
"OpenCL mapping.\n"); |
|
goto no_qsv; |
|
} |
|
if (!vaDisplayIsValid(va_display)) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "A valid VADisplay is " |
|
"required on context creation to use QSV to " |
|
"OpenCL mapping.\n"); |
|
goto no_qsv; |
|
} |
|
|
|
CL_FUNC(clCreateFromVA_APIMediaSurfaceINTEL, |
|
"Intel QSV to OpenCL mapping"); |
|
CL_FUNC(clEnqueueAcquireVA_APIMediaSurfacesINTEL, |
|
"Intel QSV in OpenCL acquire"); |
|
CL_FUNC(clEnqueueReleaseVA_APIMediaSurfacesINTEL, |
|
"Intel QSV in OpenCL release"); |
|
|
|
if (fail) { |
|
no_qsv: |
|
av_log(hwdev, AV_LOG_WARNING, "QSV to OpenCL mapping " |
|
"not usable.\n"); |
|
priv->qsv_mapping_usable = 0; |
|
} else { |
|
priv->qsv_mapping_usable = 1; |
|
} |
|
av_free(props); |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 |
|
{ |
|
int fail = 0; |
|
|
|
CL_FUNC(clCreateFromDX9MediaSurfaceKHR, |
|
"DXVA2 to OpenCL mapping"); |
|
CL_FUNC(clEnqueueAcquireDX9MediaSurfacesKHR, |
|
"DXVA2 in OpenCL acquire"); |
|
CL_FUNC(clEnqueueReleaseDX9MediaSurfacesKHR, |
|
"DXVA2 in OpenCL release"); |
|
|
|
if (fail) { |
|
av_log(hwdev, AV_LOG_WARNING, "DXVA2 to OpenCL mapping " |
|
"not usable.\n"); |
|
priv->dxva2_mapping_usable = 0; |
|
} else { |
|
priv->dx9_media_adapter_type = CL_ADAPTER_D3D9EX_KHR; |
|
priv->dxva2_mapping_usable = 1; |
|
} |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_D3D11 |
|
{ |
|
const char *d3d11_ext = "cl_khr_d3d11_sharing"; |
|
const char *nv12_ext = "cl_intel_d3d11_nv12_media_sharing"; |
|
int fail = 0; |
|
|
|
if (!opencl_check_extension(hwdev, d3d11_ext)) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
|
"required for D3D11 to OpenCL mapping.\n", d3d11_ext); |
|
fail = 1; |
|
} else if (!opencl_check_extension(hwdev, nv12_ext)) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "The %s extension may be " |
|
"required for D3D11 to OpenCL mapping.\n", nv12_ext); |
|
// Not fatal. |
|
} |
|
|
|
CL_FUNC(clCreateFromD3D11Texture2DKHR, |
|
"D3D11 to OpenCL mapping"); |
|
CL_FUNC(clEnqueueAcquireD3D11ObjectsKHR, |
|
"D3D11 in OpenCL acquire"); |
|
CL_FUNC(clEnqueueReleaseD3D11ObjectsKHR, |
|
"D3D11 in OpenCL release"); |
|
|
|
if (fail) { |
|
av_log(hwdev, AV_LOG_WARNING, "D3D11 to OpenCL mapping " |
|
"not usable.\n"); |
|
priv->d3d11_mapping_usable = 0; |
|
} else { |
|
priv->d3d11_mapping_usable = 1; |
|
} |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_ARM |
|
{ |
|
const char *drm_arm_ext = "cl_arm_import_memory"; |
|
const char *image_ext = "cl_khr_image2d_from_buffer"; |
|
int fail = 0; |
|
|
|
if (!opencl_check_extension(hwdev, drm_arm_ext)) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
|
"required for DRM to OpenCL mapping on ARM.\n", |
|
drm_arm_ext); |
|
fail = 1; |
|
} |
|
if (!opencl_check_extension(hwdev, image_ext)) { |
|
av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
|
"required for DRM to OpenCL mapping on ARM.\n", |
|
image_ext); |
|
fail = 1; |
|
} |
|
|
|
// clImportMemoryARM() is linked statically. |
|
|
|
if (fail) { |
|
av_log(hwdev, AV_LOG_WARNING, "DRM to OpenCL mapping on ARM " |
|
"not usable.\n"); |
|
priv->drm_arm_mapping_usable = 0; |
|
} else { |
|
priv->drm_arm_mapping_usable = 1; |
|
} |
|
} |
|
#endif |
|
|
|
#undef CL_FUNC |
|
|
|
return 0; |
|
} |
|
|
|
static void opencl_device_uninit(AVHWDeviceContext *hwdev) |
|
{ |
|
OpenCLDeviceContext *priv = hwdev->internal->priv; |
|
cl_int cle; |
|
|
|
if (priv->command_queue) { |
|
cle = clReleaseCommandQueue(priv->command_queue); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to release internal " |
|
"command queue reference: %d.\n", cle); |
|
} |
|
priv->command_queue = NULL; |
|
} |
|
} |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
static int opencl_filter_intel_media_vaapi_platform(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
void *context) |
|
{ |
|
// This doesn't exist as a platform extension, so just test whether |
|
// the function we will use for device enumeration exists. |
|
|
|
if (!clGetExtensionFunctionAddressForPlatform(platform_id, |
|
"clGetDeviceIDsFromVA_APIMediaAdapterINTEL")) { |
|
av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not export the " |
|
"VAAPI device enumeration function.\n", platform_name); |
|
return 1; |
|
} else { |
|
return 0; |
|
} |
|
} |
|
|
|
static int opencl_enumerate_intel_media_vaapi_devices(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
cl_uint *nb_devices, |
|
cl_device_id **devices, |
|
void *context) |
|
{ |
|
VADisplay va_display = context; |
|
clGetDeviceIDsFromVA_APIMediaAdapterINTEL_fn |
|
clGetDeviceIDsFromVA_APIMediaAdapterINTEL; |
|
cl_int cle; |
|
|
|
clGetDeviceIDsFromVA_APIMediaAdapterINTEL = |
|
clGetExtensionFunctionAddressForPlatform(platform_id, |
|
"clGetDeviceIDsFromVA_APIMediaAdapterINTEL"); |
|
if (!clGetDeviceIDsFromVA_APIMediaAdapterINTEL) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get address of " |
|
"clGetDeviceIDsFromVA_APIMediaAdapterINTEL().\n"); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
cle = clGetDeviceIDsFromVA_APIMediaAdapterINTEL( |
|
platform_id, CL_VA_API_DISPLAY_INTEL, va_display, |
|
CL_PREFERRED_DEVICES_FOR_VA_API_INTEL, 0, NULL, nb_devices); |
|
if (cle == CL_DEVICE_NOT_FOUND) { |
|
av_log(hwdev, AV_LOG_DEBUG, "No VAAPI-supporting devices found " |
|
"on platform \"%s\".\n", platform_name); |
|
*nb_devices = 0; |
|
return 0; |
|
} else if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
|
"on platform \"%s\": %d.\n", platform_name, cle); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
*devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
|
if (!*devices) |
|
return AVERROR(ENOMEM); |
|
|
|
cle = clGetDeviceIDsFromVA_APIMediaAdapterINTEL( |
|
platform_id, CL_VA_API_DISPLAY_INTEL, va_display, |
|
CL_PREFERRED_DEVICES_FOR_VA_API_INTEL, *nb_devices, *devices, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get list of VAAPI-supporting " |
|
"devices on platform \"%s\": %d.\n", platform_name, cle); |
|
av_freep(devices); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_filter_intel_media_vaapi_device(AVHWDeviceContext *hwdev, |
|
cl_device_id device_id, |
|
const char *device_name, |
|
void *context) |
|
{ |
|
const char *va_ext = "cl_intel_va_api_media_sharing"; |
|
|
|
if (opencl_check_device_extension(device_id, va_ext)) { |
|
return 0; |
|
} else { |
|
av_log(hwdev, AV_LOG_DEBUG, "Device %s does not support the " |
|
"%s extension.\n", device_name, va_ext); |
|
return 1; |
|
} |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 |
|
static int opencl_filter_dxva2_platform(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
void *context) |
|
{ |
|
const char *dx9_ext = "cl_khr_dx9_media_sharing"; |
|
|
|
if (opencl_check_platform_extension(platform_id, dx9_ext)) { |
|
return 0; |
|
} else { |
|
av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not support the " |
|
"%s extension.\n", platform_name, dx9_ext); |
|
return 1; |
|
} |
|
} |
|
|
|
static int opencl_enumerate_dxva2_devices(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
cl_uint *nb_devices, |
|
cl_device_id **devices, |
|
void *context) |
|
{ |
|
IDirect3DDevice9 *device = context; |
|
clGetDeviceIDsFromDX9MediaAdapterKHR_fn |
|
clGetDeviceIDsFromDX9MediaAdapterKHR; |
|
cl_dx9_media_adapter_type_khr media_adapter_type = CL_ADAPTER_D3D9EX_KHR; |
|
cl_int cle; |
|
|
|
clGetDeviceIDsFromDX9MediaAdapterKHR = |
|
clGetExtensionFunctionAddressForPlatform(platform_id, |
|
"clGetDeviceIDsFromDX9MediaAdapterKHR"); |
|
if (!clGetDeviceIDsFromDX9MediaAdapterKHR) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get address of " |
|
"clGetDeviceIDsFromDX9MediaAdapterKHR().\n"); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
cle = clGetDeviceIDsFromDX9MediaAdapterKHR( |
|
platform_id, 1, &media_adapter_type, (void**)&device, |
|
CL_PREFERRED_DEVICES_FOR_DX9_MEDIA_ADAPTER_KHR, |
|
0, NULL, nb_devices); |
|
if (cle == CL_DEVICE_NOT_FOUND) { |
|
av_log(hwdev, AV_LOG_DEBUG, "No DXVA2-supporting devices found " |
|
"on platform \"%s\".\n", platform_name); |
|
*nb_devices = 0; |
|
return 0; |
|
} else if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
|
"on platform \"%s\": %d.\n", platform_name, cle); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
*devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
|
if (!*devices) |
|
return AVERROR(ENOMEM); |
|
|
|
cle = clGetDeviceIDsFromDX9MediaAdapterKHR( |
|
platform_id, 1, &media_adapter_type, (void**)&device, |
|
CL_PREFERRED_DEVICES_FOR_DX9_MEDIA_ADAPTER_KHR, |
|
*nb_devices, *devices, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get list of DXVA2-supporting " |
|
"devices on platform \"%s\": %d.\n", platform_name, cle); |
|
av_freep(devices); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
return 0; |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_D3D11 |
|
static int opencl_filter_d3d11_platform(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
void *context) |
|
{ |
|
const char *d3d11_ext = "cl_khr_d3d11_sharing"; |
|
|
|
if (opencl_check_platform_extension(platform_id, d3d11_ext)) { |
|
return 0; |
|
} else { |
|
av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not support the " |
|
"%s extension.\n", platform_name, d3d11_ext); |
|
return 1; |
|
} |
|
} |
|
|
|
static int opencl_enumerate_d3d11_devices(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
cl_uint *nb_devices, |
|
cl_device_id **devices, |
|
void *context) |
|
{ |
|
ID3D11Device *device = context; |
|
clGetDeviceIDsFromD3D11KHR_fn clGetDeviceIDsFromD3D11KHR; |
|
cl_int cle; |
|
|
|
clGetDeviceIDsFromD3D11KHR = |
|
clGetExtensionFunctionAddressForPlatform(platform_id, |
|
"clGetDeviceIDsFromD3D11KHR"); |
|
if (!clGetDeviceIDsFromD3D11KHR) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get address of " |
|
"clGetDeviceIDsFromD3D11KHR().\n"); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
cle = clGetDeviceIDsFromD3D11KHR(platform_id, |
|
CL_D3D11_DEVICE_KHR, device, |
|
CL_PREFERRED_DEVICES_FOR_D3D11_KHR, |
|
0, NULL, nb_devices); |
|
if (cle == CL_DEVICE_NOT_FOUND) { |
|
av_log(hwdev, AV_LOG_DEBUG, "No D3D11-supporting devices found " |
|
"on platform \"%s\".\n", platform_name); |
|
*nb_devices = 0; |
|
return 0; |
|
} else if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
|
"on platform \"%s\": %d.\n", platform_name, cle); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
*devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
|
if (!*devices) |
|
return AVERROR(ENOMEM); |
|
|
|
cle = clGetDeviceIDsFromD3D11KHR(platform_id, |
|
CL_D3D11_DEVICE_KHR, device, |
|
CL_PREFERRED_DEVICES_FOR_D3D11_KHR, |
|
*nb_devices, *devices, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to get list of D3D11-supporting " |
|
"devices on platform \"%s\": %d.\n", platform_name, cle); |
|
av_freep(devices); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
return 0; |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 || HAVE_OPENCL_D3D11 |
|
static int opencl_filter_gpu_device(AVHWDeviceContext *hwdev, |
|
cl_device_id device_id, |
|
const char *device_name, |
|
void *context) |
|
{ |
|
cl_device_type device_type; |
|
cl_int cle; |
|
|
|
cle = clGetDeviceInfo(device_id, CL_DEVICE_TYPE, |
|
sizeof(device_type), &device_type, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query device type " |
|
"of device \"%s\".\n", device_name); |
|
return AVERROR_UNKNOWN; |
|
} |
|
if (!(device_type & CL_DEVICE_TYPE_GPU)) { |
|
av_log(hwdev, AV_LOG_DEBUG, "Device %s skipped (not GPU).\n", |
|
device_name); |
|
return 1; |
|
} |
|
|
|
return 0; |
|
} |
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_ARM |
|
static int opencl_filter_drm_arm_platform(AVHWDeviceContext *hwdev, |
|
cl_platform_id platform_id, |
|
const char *platform_name, |
|
void *context) |
|
{ |
|
const char *drm_arm_ext = "cl_arm_import_memory"; |
|
|
|
if (opencl_check_platform_extension(platform_id, drm_arm_ext)) { |
|
return 0; |
|
} else { |
|
av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not support the " |
|
"%s extension.\n", platform_name, drm_arm_ext); |
|
return 1; |
|
} |
|
} |
|
|
|
static int opencl_filter_drm_arm_device(AVHWDeviceContext *hwdev, |
|
cl_device_id device_id, |
|
const char *device_name, |
|
void *context) |
|
{ |
|
const char *drm_arm_ext = "cl_arm_import_memory"; |
|
|
|
if (opencl_check_device_extension(device_id, drm_arm_ext)) { |
|
return 0; |
|
} else { |
|
av_log(hwdev, AV_LOG_DEBUG, "Device %s does not support the " |
|
"%s extension.\n", device_name, drm_arm_ext); |
|
return 1; |
|
} |
|
} |
|
#endif |
|
|
|
static int opencl_device_derive(AVHWDeviceContext *hwdev, |
|
AVHWDeviceContext *src_ctx, AVDictionary *opts, |
|
int flags) |
|
{ |
|
int err; |
|
switch (src_ctx->type) { |
|
|
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
case AV_HWDEVICE_TYPE_DRM: |
|
case AV_HWDEVICE_TYPE_VAAPI: |
|
{ |
|
// Surface mapping works via DRM PRIME fds with no special |
|
// initialisation required in advance. This just finds the |
|
// Beignet ICD by name. |
|
AVDictionary *selector_opts = NULL; |
|
|
|
err = av_dict_set(&selector_opts, "platform_vendor", "Intel", 0); |
|
if (err >= 0) |
|
err = av_dict_set(&selector_opts, "platform_version", "beignet", 0); |
|
if (err >= 0) { |
|
OpenCLDeviceSelector selector = { |
|
.platform_index = -1, |
|
.device_index = 0, |
|
.context = selector_opts, |
|
.enumerate_platforms = &opencl_enumerate_platforms, |
|
.filter_platform = &opencl_filter_platform, |
|
.enumerate_devices = &opencl_enumerate_devices, |
|
.filter_device = NULL, |
|
}; |
|
err = opencl_device_create_internal(hwdev, &selector, NULL); |
|
} |
|
av_dict_free(&selector_opts); |
|
} |
|
break; |
|
#endif |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
// The generic code automatically attempts to derive from all |
|
// ancestors of the given device, so we can ignore QSV devices here |
|
// and just consider the inner VAAPI device it was derived from. |
|
case AV_HWDEVICE_TYPE_VAAPI: |
|
{ |
|
AVVAAPIDeviceContext *src_hwctx = src_ctx->hwctx; |
|
cl_context_properties props[7] = { |
|
CL_CONTEXT_PLATFORM, |
|
0, |
|
CL_CONTEXT_VA_API_DISPLAY_INTEL, |
|
(intptr_t)src_hwctx->display, |
|
CL_CONTEXT_INTEROP_USER_SYNC, |
|
CL_FALSE, |
|
0, |
|
}; |
|
OpenCLDeviceSelector selector = { |
|
.platform_index = -1, |
|
.device_index = -1, |
|
.context = src_hwctx->display, |
|
.enumerate_platforms = &opencl_enumerate_platforms, |
|
.filter_platform = &opencl_filter_intel_media_vaapi_platform, |
|
.enumerate_devices = &opencl_enumerate_intel_media_vaapi_devices, |
|
.filter_device = &opencl_filter_intel_media_vaapi_device, |
|
}; |
|
|
|
err = opencl_device_create_internal(hwdev, &selector, props); |
|
} |
|
break; |
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 |
|
case AV_HWDEVICE_TYPE_DXVA2: |
|
{ |
|
AVDXVA2DeviceContext *src_hwctx = src_ctx->hwctx; |
|
IDirect3DDevice9 *device; |
|
HANDLE device_handle; |
|
HRESULT hr; |
|
|
|
hr = IDirect3DDeviceManager9_OpenDeviceHandle(src_hwctx->devmgr, |
|
&device_handle); |
|
if (FAILED(hr)) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to open device handle " |
|
"for Direct3D9 device: %lx.\n", (unsigned long)hr); |
|
err = AVERROR_UNKNOWN; |
|
break; |
|
} |
|
|
|
hr = IDirect3DDeviceManager9_LockDevice(src_hwctx->devmgr, |
|
device_handle, |
|
&device, FALSE); |
|
if (SUCCEEDED(hr)) { |
|
cl_context_properties props[5] = { |
|
CL_CONTEXT_PLATFORM, |
|
0, |
|
CL_CONTEXT_ADAPTER_D3D9EX_KHR, |
|
(intptr_t)device, |
|
0, |
|
}; |
|
OpenCLDeviceSelector selector = { |
|
.platform_index = -1, |
|
.device_index = -1, |
|
.context = device, |
|
.enumerate_platforms = &opencl_enumerate_platforms, |
|
.filter_platform = &opencl_filter_dxva2_platform, |
|
.enumerate_devices = &opencl_enumerate_dxva2_devices, |
|
.filter_device = &opencl_filter_gpu_device, |
|
}; |
|
|
|
err = opencl_device_create_internal(hwdev, &selector, props); |
|
|
|
IDirect3DDeviceManager9_UnlockDevice(src_hwctx->devmgr, |
|
device_handle, FALSE); |
|
} else { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to lock device handle " |
|
"for Direct3D9 device: %lx.\n", (unsigned long)hr); |
|
err = AVERROR_UNKNOWN; |
|
} |
|
|
|
IDirect3DDeviceManager9_CloseDeviceHandle(src_hwctx->devmgr, |
|
device_handle); |
|
} |
|
break; |
|
#endif |
|
|
|
#if HAVE_OPENCL_D3D11 |
|
case AV_HWDEVICE_TYPE_D3D11VA: |
|
{ |
|
AVD3D11VADeviceContext *src_hwctx = src_ctx->hwctx; |
|
cl_context_properties props[5] = { |
|
CL_CONTEXT_PLATFORM, |
|
0, |
|
CL_CONTEXT_D3D11_DEVICE_KHR, |
|
(intptr_t)src_hwctx->device, |
|
0, |
|
}; |
|
OpenCLDeviceSelector selector = { |
|
.platform_index = -1, |
|
.device_index = -1, |
|
.context = src_hwctx->device, |
|
.enumerate_platforms = &opencl_enumerate_platforms, |
|
.filter_platform = &opencl_filter_d3d11_platform, |
|
.enumerate_devices = &opencl_enumerate_d3d11_devices, |
|
.filter_device = &opencl_filter_gpu_device, |
|
}; |
|
|
|
err = opencl_device_create_internal(hwdev, &selector, props); |
|
} |
|
break; |
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_ARM |
|
case AV_HWDEVICE_TYPE_DRM: |
|
{ |
|
OpenCLDeviceSelector selector = { |
|
.platform_index = -1, |
|
.device_index = -1, |
|
.context = NULL, |
|
.enumerate_platforms = &opencl_enumerate_platforms, |
|
.filter_platform = &opencl_filter_drm_arm_platform, |
|
.enumerate_devices = &opencl_enumerate_devices, |
|
.filter_device = &opencl_filter_drm_arm_device, |
|
}; |
|
|
|
err = opencl_device_create_internal(hwdev, &selector, NULL); |
|
} |
|
break; |
|
#endif |
|
|
|
default: |
|
err = AVERROR(ENOSYS); |
|
break; |
|
} |
|
|
|
return err; |
|
} |
|
|
|
static int opencl_get_plane_format(enum AVPixelFormat pixfmt, |
|
int plane, int width, int height, |
|
cl_image_format *image_format, |
|
cl_image_desc *image_desc) |
|
{ |
|
const AVPixFmtDescriptor *desc; |
|
const AVComponentDescriptor *comp; |
|
int channels = 0, order = 0, depth = 0, step = 0; |
|
int wsub, hsub, alpha; |
|
int c; |
|
|
|
if (plane >= AV_NUM_DATA_POINTERS) |
|
return AVERROR(ENOENT); |
|
|
|
desc = av_pix_fmt_desc_get(pixfmt); |
|
|
|
// Only normal images are allowed. |
|
if (desc->flags & (AV_PIX_FMT_FLAG_BITSTREAM | |
|
AV_PIX_FMT_FLAG_HWACCEL | |
|
AV_PIX_FMT_FLAG_PAL)) |
|
return AVERROR(EINVAL); |
|
|
|
wsub = 1 << desc->log2_chroma_w; |
|
hsub = 1 << desc->log2_chroma_h; |
|
// Subsampled components must be exact. |
|
if (width & wsub - 1 || height & hsub - 1) |
|
return AVERROR(EINVAL); |
|
|
|
for (c = 0; c < desc->nb_components; c++) { |
|
comp = &desc->comp[c]; |
|
if (comp->plane != plane) |
|
continue; |
|
// The step size must be a power of two. |
|
if (comp->step != 1 && comp->step != 2 && |
|
comp->step != 4 && comp->step != 8) |
|
return AVERROR(EINVAL); |
|
// The bits in each component must be packed in the |
|
// most-significant-bits of the relevant bytes. |
|
if (comp->shift + comp->depth != 8 && |
|
comp->shift + comp->depth != 16) |
|
return AVERROR(EINVAL); |
|
// The depth must not vary between components. |
|
if (depth && comp->depth != depth) |
|
return AVERROR(EINVAL); |
|
// If a single data element crosses multiple bytes then |
|
// it must match the native endianness. |
|
if (comp->depth > 8 && |
|
HAVE_BIGENDIAN == !(desc->flags & AV_PIX_FMT_FLAG_BE)) |
|
return AVERROR(EINVAL); |
|
// A single data element must not contain multiple samples |
|
// from the same component. |
|
if (step && comp->step != step) |
|
return AVERROR(EINVAL); |
|
|
|
depth = comp->depth; |
|
order = order * 10 + comp->offset / ((depth + 7) / 8) + 1; |
|
step = comp->step; |
|
alpha = (desc->flags & AV_PIX_FMT_FLAG_ALPHA && |
|
c == desc->nb_components - 1); |
|
++channels; |
|
} |
|
if (channels == 0) |
|
return AVERROR(ENOENT); |
|
|
|
memset(image_format, 0, sizeof(*image_format)); |
|
memset(image_desc, 0, sizeof(*image_desc)); |
|
image_desc->image_type = CL_MEM_OBJECT_IMAGE2D; |
|
|
|
if (plane == 0 || alpha) { |
|
image_desc->image_width = width; |
|
image_desc->image_height = height; |
|
image_desc->image_row_pitch = step * width; |
|
} else { |
|
image_desc->image_width = width / wsub; |
|
image_desc->image_height = height / hsub; |
|
image_desc->image_row_pitch = step * width / wsub; |
|
} |
|
|
|
if (depth <= 8) { |
|
image_format->image_channel_data_type = CL_UNORM_INT8; |
|
} else { |
|
if (depth <= 16) |
|
image_format->image_channel_data_type = CL_UNORM_INT16; |
|
else |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
#define CHANNEL_ORDER(order, type) \ |
|
case order: image_format->image_channel_order = type; break; |
|
switch (order) { |
|
CHANNEL_ORDER(1, CL_R); |
|
CHANNEL_ORDER(12, CL_RG); |
|
CHANNEL_ORDER(1234, CL_RGBA); |
|
CHANNEL_ORDER(2341, CL_ARGB); |
|
CHANNEL_ORDER(3214, CL_BGRA); |
|
#ifdef CL_ABGR |
|
CHANNEL_ORDER(4321, CL_ABGR); |
|
#endif |
|
default: |
|
return AVERROR(EINVAL); |
|
} |
|
#undef CHANNEL_ORDER |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_frames_get_constraints(AVHWDeviceContext *hwdev, |
|
const void *hwconfig, |
|
AVHWFramesConstraints *constraints) |
|
{ |
|
AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
|
cl_uint nb_image_formats; |
|
cl_image_format *image_formats = NULL; |
|
cl_int cle; |
|
enum AVPixelFormat pix_fmt; |
|
int err, pix_fmts_found; |
|
size_t max_width, max_height; |
|
|
|
cle = clGetDeviceInfo(hwctx->device_id, CL_DEVICE_IMAGE2D_MAX_WIDTH, |
|
sizeof(max_width), &max_width, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query maximum " |
|
"supported image width: %d.\n", cle); |
|
} else { |
|
constraints->max_width = max_width; |
|
} |
|
cle = clGetDeviceInfo(hwctx->device_id, CL_DEVICE_IMAGE2D_MAX_HEIGHT, |
|
sizeof(max_height), &max_height, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query maximum " |
|
"supported image height: %d.\n", cle); |
|
} else { |
|
constraints->max_height = max_height; |
|
} |
|
av_log(hwdev, AV_LOG_DEBUG, "Maximum supported image size %dx%d.\n", |
|
constraints->max_width, constraints->max_height); |
|
|
|
cle = clGetSupportedImageFormats(hwctx->context, |
|
CL_MEM_READ_WRITE, |
|
CL_MEM_OBJECT_IMAGE2D, |
|
0, NULL, &nb_image_formats); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query supported " |
|
"image formats: %d.\n", cle); |
|
err = AVERROR(ENOSYS); |
|
goto fail; |
|
} |
|
if (nb_image_formats == 0) { |
|
av_log(hwdev, AV_LOG_ERROR, "No image support in OpenCL " |
|
"driver (zero supported image formats).\n"); |
|
err = AVERROR(ENOSYS); |
|
goto fail; |
|
} |
|
|
|
image_formats = |
|
av_malloc_array(nb_image_formats, sizeof(*image_formats)); |
|
if (!image_formats) { |
|
err = AVERROR(ENOMEM); |
|
goto fail; |
|
} |
|
|
|
cle = clGetSupportedImageFormats(hwctx->context, |
|
CL_MEM_READ_WRITE, |
|
CL_MEM_OBJECT_IMAGE2D, |
|
nb_image_formats, |
|
image_formats, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwdev, AV_LOG_ERROR, "Failed to query supported " |
|
"image formats: %d.\n", cle); |
|
err = AVERROR(ENOSYS); |
|
goto fail; |
|
} |
|
|
|
pix_fmts_found = 0; |
|
for (pix_fmt = 0; pix_fmt < AV_PIX_FMT_NB; pix_fmt++) { |
|
cl_image_format image_format; |
|
cl_image_desc image_desc; |
|
int plane, i; |
|
|
|
for (plane = 0;; plane++) { |
|
err = opencl_get_plane_format(pix_fmt, plane, 0, 0, |
|
&image_format, |
|
&image_desc); |
|
if (err < 0) |
|
break; |
|
|
|
for (i = 0; i < nb_image_formats; i++) { |
|
if (image_formats[i].image_channel_order == |
|
image_format.image_channel_order && |
|
image_formats[i].image_channel_data_type == |
|
image_format.image_channel_data_type) |
|
break; |
|
} |
|
if (i == nb_image_formats) { |
|
err = AVERROR(EINVAL); |
|
break; |
|
} |
|
} |
|
if (err != AVERROR(ENOENT)) |
|
continue; |
|
|
|
av_log(hwdev, AV_LOG_DEBUG, "Format %s supported.\n", |
|
av_get_pix_fmt_name(pix_fmt)); |
|
|
|
err = av_reallocp_array(&constraints->valid_sw_formats, |
|
pix_fmts_found + 2, |
|
sizeof(*constraints->valid_sw_formats)); |
|
if (err < 0) |
|
goto fail; |
|
constraints->valid_sw_formats[pix_fmts_found] = pix_fmt; |
|
constraints->valid_sw_formats[pix_fmts_found + 1] = |
|
AV_PIX_FMT_NONE; |
|
++pix_fmts_found; |
|
} |
|
|
|
av_freep(&image_formats); |
|
|
|
constraints->valid_hw_formats = |
|
av_malloc_array(2, sizeof(*constraints->valid_hw_formats)); |
|
if (!constraints->valid_hw_formats) { |
|
err = AVERROR(ENOMEM); |
|
goto fail; |
|
} |
|
constraints->valid_hw_formats[0] = AV_PIX_FMT_OPENCL; |
|
constraints->valid_hw_formats[1] = AV_PIX_FMT_NONE; |
|
|
|
return 0; |
|
|
|
fail: |
|
av_freep(&image_formats); |
|
return err; |
|
} |
|
|
|
static void opencl_pool_free(void *opaque, uint8_t *data) |
|
{ |
|
AVHWFramesContext *hwfc = opaque; |
|
AVOpenCLFrameDescriptor *desc = (AVOpenCLFrameDescriptor*)data; |
|
cl_int cle; |
|
int p; |
|
|
|
for (p = 0; p < desc->nb_planes; p++) { |
|
cle = clReleaseMemObject(desc->planes[p]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to release plane %d: " |
|
"%d.\n", p, cle); |
|
} |
|
} |
|
|
|
av_free(desc); |
|
} |
|
|
|
static AVBufferRef *opencl_pool_alloc(void *opaque, size_t size) |
|
{ |
|
AVHWFramesContext *hwfc = opaque; |
|
AVOpenCLDeviceContext *hwctx = hwfc->device_ctx->hwctx; |
|
AVOpenCLFrameDescriptor *desc; |
|
cl_int cle; |
|
cl_mem image; |
|
cl_image_format image_format; |
|
cl_image_desc image_desc; |
|
int err, p; |
|
AVBufferRef *ref; |
|
|
|
desc = av_mallocz(sizeof(*desc)); |
|
if (!desc) |
|
return NULL; |
|
|
|
for (p = 0;; p++) { |
|
err = opencl_get_plane_format(hwfc->sw_format, p, |
|
hwfc->width, hwfc->height, |
|
&image_format, &image_desc); |
|
if (err == AVERROR(ENOENT)) |
|
break; |
|
if (err < 0) |
|
goto fail; |
|
|
|
// For generic image objects, the pitch is determined by the |
|
// implementation. |
|
image_desc.image_row_pitch = 0; |
|
|
|
image = clCreateImage(hwctx->context, CL_MEM_READ_WRITE, |
|
&image_format, &image_desc, NULL, &cle); |
|
if (!image) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to create image for " |
|
"plane %d: %d.\n", p, cle); |
|
goto fail; |
|
} |
|
|
|
desc->planes[p] = image; |
|
} |
|
|
|
desc->nb_planes = p; |
|
|
|
ref = av_buffer_create((uint8_t*)desc, sizeof(*desc), |
|
&opencl_pool_free, hwfc, 0); |
|
if (!ref) |
|
goto fail; |
|
|
|
return ref; |
|
|
|
fail: |
|
for (p = 0; desc->planes[p]; p++) |
|
clReleaseMemObject(desc->planes[p]); |
|
av_free(desc); |
|
return NULL; |
|
} |
|
|
|
static int opencl_frames_init_command_queue(AVHWFramesContext *hwfc) |
|
{ |
|
AVOpenCLFramesContext *hwctx = hwfc->hwctx; |
|
OpenCLDeviceContext *devpriv = hwfc->device_ctx->internal->priv; |
|
OpenCLFramesContext *priv = hwfc->internal->priv; |
|
cl_int cle; |
|
|
|
priv->command_queue = hwctx->command_queue ? hwctx->command_queue |
|
: devpriv->command_queue; |
|
cle = clRetainCommandQueue(priv->command_queue); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to retain frame " |
|
"command queue: %d.\n", cle); |
|
return AVERROR(EIO); |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_frames_init(AVHWFramesContext *hwfc) |
|
{ |
|
if (!hwfc->pool) { |
|
hwfc->internal->pool_internal = |
|
av_buffer_pool_init2(sizeof(cl_mem), hwfc, |
|
&opencl_pool_alloc, NULL); |
|
if (!hwfc->internal->pool_internal) |
|
return AVERROR(ENOMEM); |
|
} |
|
|
|
return opencl_frames_init_command_queue(hwfc); |
|
} |
|
|
|
static void opencl_frames_uninit(AVHWFramesContext *hwfc) |
|
{ |
|
OpenCLFramesContext *priv = hwfc->internal->priv; |
|
cl_int cle; |
|
|
|
#if HAVE_OPENCL_DXVA2 || HAVE_OPENCL_D3D11 |
|
int i, p; |
|
for (i = 0; i < priv->nb_mapped_frames; i++) { |
|
AVOpenCLFrameDescriptor *desc = &priv->mapped_frames[i]; |
|
for (p = 0; p < desc->nb_planes; p++) { |
|
cle = clReleaseMemObject(desc->planes[p]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to release mapped " |
|
"frame object (frame %d plane %d): %d.\n", |
|
i, p, cle); |
|
} |
|
} |
|
} |
|
av_freep(&priv->mapped_frames); |
|
#endif |
|
|
|
if (priv->command_queue) { |
|
cle = clReleaseCommandQueue(priv->command_queue); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to release frame " |
|
"command queue: %d.\n", cle); |
|
} |
|
priv->command_queue = NULL; |
|
} |
|
} |
|
|
|
static int opencl_get_buffer(AVHWFramesContext *hwfc, AVFrame *frame) |
|
{ |
|
AVOpenCLFrameDescriptor *desc; |
|
int p; |
|
|
|
frame->buf[0] = av_buffer_pool_get(hwfc->pool); |
|
if (!frame->buf[0]) |
|
return AVERROR(ENOMEM); |
|
|
|
desc = (AVOpenCLFrameDescriptor*)frame->buf[0]->data; |
|
|
|
for (p = 0; p < desc->nb_planes; p++) |
|
frame->data[p] = (uint8_t*)desc->planes[p]; |
|
|
|
frame->format = AV_PIX_FMT_OPENCL; |
|
frame->width = hwfc->width; |
|
frame->height = hwfc->height; |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_transfer_get_formats(AVHWFramesContext *hwfc, |
|
enum AVHWFrameTransferDirection dir, |
|
enum AVPixelFormat **formats) |
|
{ |
|
enum AVPixelFormat *fmts; |
|
|
|
fmts = av_malloc_array(2, sizeof(*fmts)); |
|
if (!fmts) |
|
return AVERROR(ENOMEM); |
|
|
|
fmts[0] = hwfc->sw_format; |
|
fmts[1] = AV_PIX_FMT_NONE; |
|
|
|
*formats = fmts; |
|
return 0; |
|
} |
|
|
|
static int opencl_wait_events(AVHWFramesContext *hwfc, |
|
cl_event *events, int nb_events) |
|
{ |
|
cl_int cle; |
|
int i; |
|
|
|
cle = clWaitForEvents(nb_events, events); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to wait for event " |
|
"completion: %d.\n", cle); |
|
return AVERROR(EIO); |
|
} |
|
|
|
for (i = 0; i < nb_events; i++) { |
|
cle = clReleaseEvent(events[i]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to release " |
|
"event: %d.\n", cle); |
|
} |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int opencl_transfer_data_from(AVHWFramesContext *hwfc, |
|
AVFrame *dst, const AVFrame *src) |
|
{ |
|
OpenCLFramesContext *priv = hwfc->internal->priv; |
|
cl_image_format image_format; |
|
cl_image_desc image_desc; |
|
cl_int cle; |
|
size_t origin[3] = { 0, 0, 0 }; |
|
size_t region[3]; |
|
cl_event events[AV_NUM_DATA_POINTERS]; |
|
int err, p; |
|
|
|
if (dst->format != hwfc->sw_format) |
|
return AVERROR(EINVAL); |
|
|
|
for (p = 0;; p++) { |
|
err = opencl_get_plane_format(hwfc->sw_format, p, |
|
src->width, src->height, |
|
&image_format, &image_desc); |
|
if (err < 0) { |
|
if (err == AVERROR(ENOENT)) |
|
err = 0; |
|
break; |
|
} |
|
|
|
if (!dst->data[p]) { |
|
av_log(hwfc, AV_LOG_ERROR, "Plane %d missing on " |
|
"destination frame for transfer.\n", p); |
|
err = AVERROR(EINVAL); |
|
break; |
|
} |
|
|
|
region[0] = image_desc.image_width; |
|
region[1] = image_desc.image_height; |
|
region[2] = 1; |
|
|
|
cle = clEnqueueReadImage(priv->command_queue, |
|
(cl_mem)src->data[p], |
|
CL_FALSE, origin, region, |
|
dst->linesize[p], 0, |
|
dst->data[p], |
|
0, NULL, &events[p]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to enqueue read of " |
|
"OpenCL image plane %d: %d.\n", p, cle); |
|
err = AVERROR(EIO); |
|
break; |
|
} |
|
} |
|
|
|
opencl_wait_events(hwfc, events, p); |
|
|
|
return err; |
|
} |
|
|
|
static int opencl_transfer_data_to(AVHWFramesContext *hwfc, |
|
AVFrame *dst, const AVFrame *src) |
|
{ |
|
OpenCLFramesContext *priv = hwfc->internal->priv; |
|
cl_image_format image_format; |
|
cl_image_desc image_desc; |
|
cl_int cle; |
|
size_t origin[3] = { 0, 0, 0 }; |
|
size_t region[3]; |
|
cl_event events[AV_NUM_DATA_POINTERS]; |
|
int err, p; |
|
|
|
if (src->format != hwfc->sw_format) |
|
return AVERROR(EINVAL); |
|
|
|
for (p = 0;; p++) { |
|
err = opencl_get_plane_format(hwfc->sw_format, p, |
|
src->width, src->height, |
|
&image_format, &image_desc); |
|
if (err < 0) { |
|
if (err == AVERROR(ENOENT)) |
|
err = 0; |
|
break; |
|
} |
|
|
|
if (!src->data[p]) { |
|
av_log(hwfc, AV_LOG_ERROR, "Plane %d missing on " |
|
"source frame for transfer.\n", p); |
|
err = AVERROR(EINVAL); |
|
break; |
|
} |
|
|
|
region[0] = image_desc.image_width; |
|
region[1] = image_desc.image_height; |
|
region[2] = 1; |
|
|
|
cle = clEnqueueWriteImage(priv->command_queue, |
|
(cl_mem)dst->data[p], |
|
CL_FALSE, origin, region, |
|
src->linesize[p], 0, |
|
src->data[p], |
|
0, NULL, &events[p]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to enqueue write of " |
|
"OpenCL image plane %d: %d.\n", p, cle); |
|
err = AVERROR(EIO); |
|
break; |
|
} |
|
} |
|
|
|
opencl_wait_events(hwfc, events, p); |
|
|
|
return err; |
|
} |
|
|
|
typedef struct OpenCLMapping { |
|
// The mapped addresses for each plane. |
|
// The destination frame is not available when we unmap, so these |
|
// need to be stored separately. |
|
void *address[AV_NUM_DATA_POINTERS]; |
|
} OpenCLMapping; |
|
|
|
static void opencl_unmap_frame(AVHWFramesContext *hwfc, |
|
HWMapDescriptor *hwmap) |
|
{ |
|
OpenCLFramesContext *priv = hwfc->internal->priv; |
|
OpenCLMapping *map = hwmap->priv; |
|
cl_event events[AV_NUM_DATA_POINTERS]; |
|
int p, e; |
|
cl_int cle; |
|
|
|
for (p = e = 0; p < FF_ARRAY_ELEMS(map->address); p++) { |
|
if (!map->address[p]) |
|
break; |
|
|
|
cle = clEnqueueUnmapMemObject(priv->command_queue, |
|
(cl_mem)hwmap->source->data[p], |
|
map->address[p], |
|
0, NULL, &events[e]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to unmap OpenCL " |
|
"image plane %d: %d.\n", p, cle); |
|
} |
|
++e; |
|
} |
|
|
|
opencl_wait_events(hwfc, events, e); |
|
|
|
av_free(map); |
|
} |
|
|
|
static int opencl_map_frame(AVHWFramesContext *hwfc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
OpenCLFramesContext *priv = hwfc->internal->priv; |
|
cl_map_flags map_flags; |
|
cl_image_format image_format; |
|
cl_image_desc image_desc; |
|
cl_int cle; |
|
OpenCLMapping *map; |
|
size_t origin[3] = { 0, 0, 0 }; |
|
size_t region[3]; |
|
size_t row_pitch; |
|
cl_event events[AV_NUM_DATA_POINTERS]; |
|
int err, p; |
|
|
|
av_assert0(hwfc->sw_format == dst->format); |
|
|
|
if (flags & AV_HWFRAME_MAP_OVERWRITE && |
|
!(flags & AV_HWFRAME_MAP_READ)) { |
|
// This is mutually exclusive with the read/write flags, so |
|
// there is no way to map with read here. |
|
map_flags = CL_MAP_WRITE_INVALIDATE_REGION; |
|
} else { |
|
map_flags = 0; |
|
if (flags & AV_HWFRAME_MAP_READ) |
|
map_flags |= CL_MAP_READ; |
|
if (flags & AV_HWFRAME_MAP_WRITE) |
|
map_flags |= CL_MAP_WRITE; |
|
} |
|
|
|
map = av_mallocz(sizeof(*map)); |
|
if (!map) |
|
return AVERROR(ENOMEM); |
|
|
|
for (p = 0;; p++) { |
|
err = opencl_get_plane_format(hwfc->sw_format, p, |
|
src->width, src->height, |
|
&image_format, &image_desc); |
|
if (err == AVERROR(ENOENT)) |
|
break; |
|
if (err < 0) |
|
goto fail; |
|
|
|
region[0] = image_desc.image_width; |
|
region[1] = image_desc.image_height; |
|
region[2] = 1; |
|
|
|
map->address[p] = |
|
clEnqueueMapImage(priv->command_queue, |
|
(cl_mem)src->data[p], |
|
CL_FALSE, map_flags, origin, region, |
|
&row_pitch, NULL, 0, NULL, |
|
&events[p], &cle); |
|
if (!map->address[p]) { |
|
av_log(hwfc, AV_LOG_ERROR, "Failed to map OpenCL " |
|
"image plane %d: %d.\n", p, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
|
|
dst->data[p] = map->address[p]; |
|
|
|
av_log(hwfc, AV_LOG_DEBUG, "Map plane %d (%p -> %p).\n", |
|
p, src->data[p], dst->data[p]); |
|
} |
|
|
|
err = opencl_wait_events(hwfc, events, p); |
|
if (err < 0) |
|
goto fail; |
|
|
|
err = ff_hwframe_map_create(src->hw_frames_ctx, dst, src, |
|
&opencl_unmap_frame, map); |
|
if (err < 0) |
|
goto fail; |
|
|
|
dst->width = src->width; |
|
dst->height = src->height; |
|
|
|
return 0; |
|
|
|
fail: |
|
for (p = 0; p < AV_NUM_DATA_POINTERS; p++) { |
|
if (!map->address[p]) |
|
break; |
|
clEnqueueUnmapMemObject(priv->command_queue, |
|
(cl_mem)src->data[p], |
|
map->address[p], |
|
0, NULL, &events[p]); |
|
} |
|
if (p > 0) |
|
opencl_wait_events(hwfc, events, p); |
|
av_freep(&map); |
|
return err; |
|
} |
|
|
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
|
|
typedef struct DRMBeignetToOpenCLMapping { |
|
AVFrame *drm_frame; |
|
AVDRMFrameDescriptor *drm_desc; |
|
|
|
AVOpenCLFrameDescriptor frame; |
|
} DRMBeignetToOpenCLMapping; |
|
|
|
static void opencl_unmap_from_drm_beignet(AVHWFramesContext *dst_fc, |
|
HWMapDescriptor *hwmap) |
|
{ |
|
DRMBeignetToOpenCLMapping *mapping = hwmap->priv; |
|
cl_int cle; |
|
int i; |
|
|
|
for (i = 0; i < mapping->frame.nb_planes; i++) { |
|
cle = clReleaseMemObject(mapping->frame.planes[i]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to release CL image " |
|
"of plane %d of DRM frame: %d.\n", i, cle); |
|
} |
|
} |
|
|
|
av_free(mapping); |
|
} |
|
|
|
static int opencl_map_from_drm_beignet(AVHWFramesContext *dst_fc, |
|
AVFrame *dst, const AVFrame *src, |
|
int flags) |
|
{ |
|
AVOpenCLDeviceContext *hwctx = dst_fc->device_ctx->hwctx; |
|
OpenCLDeviceContext *priv = dst_fc->device_ctx->internal->priv; |
|
DRMBeignetToOpenCLMapping *mapping; |
|
const AVDRMFrameDescriptor *desc; |
|
cl_int cle; |
|
int err, i, j, p; |
|
|
|
desc = (const AVDRMFrameDescriptor*)src->data[0]; |
|
|
|
mapping = av_mallocz(sizeof(*mapping)); |
|
if (!mapping) |
|
return AVERROR(ENOMEM); |
|
|
|
p = 0; |
|
for (i = 0; i < desc->nb_layers; i++) { |
|
const AVDRMLayerDescriptor *layer = &desc->layers[i]; |
|
for (j = 0; j < layer->nb_planes; j++) { |
|
const AVDRMPlaneDescriptor *plane = &layer->planes[j]; |
|
const AVDRMObjectDescriptor *object = |
|
&desc->objects[plane->object_index]; |
|
|
|
cl_import_image_info_intel image_info = { |
|
.fd = object->fd, |
|
.size = object->size, |
|
.type = CL_MEM_OBJECT_IMAGE2D, |
|
.offset = plane->offset, |
|
.row_pitch = plane->pitch, |
|
}; |
|
cl_image_desc image_desc; |
|
|
|
err = opencl_get_plane_format(dst_fc->sw_format, p, |
|
src->width, src->height, |
|
&image_info.fmt, |
|
&image_desc); |
|
if (err < 0) { |
|
av_log(dst_fc, AV_LOG_ERROR, "DRM frame layer %d " |
|
"plane %d is not representable in OpenCL: %d.\n", |
|
i, j, err); |
|
goto fail; |
|
} |
|
image_info.width = image_desc.image_width; |
|
image_info.height = image_desc.image_height; |
|
|
|
mapping->frame.planes[p] = |
|
priv->clCreateImageFromFdINTEL(hwctx->context, |
|
&image_info, &cle); |
|
if (!mapping->frame.planes[p]) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL image " |
|
"from layer %d plane %d of DRM frame: %d.\n", |
|
i, j, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
|
|
dst->data[p] = (uint8_t*)mapping->frame.planes[p]; |
|
mapping->frame.nb_planes = ++p; |
|
} |
|
} |
|
|
|
err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
|
&opencl_unmap_from_drm_beignet, |
|
mapping); |
|
if (err < 0) |
|
goto fail; |
|
|
|
dst->width = src->width; |
|
dst->height = src->height; |
|
|
|
return 0; |
|
|
|
fail: |
|
for (p = 0; p < mapping->frame.nb_planes; p++) { |
|
if (mapping->frame.planes[p]) |
|
clReleaseMemObject(mapping->frame.planes[p]); |
|
} |
|
av_free(mapping); |
|
return err; |
|
} |
|
|
|
#if HAVE_OPENCL_VAAPI_BEIGNET |
|
|
|
static int opencl_map_from_vaapi(AVHWFramesContext *dst_fc, |
|
AVFrame *dst, const AVFrame *src, |
|
int flags) |
|
{ |
|
AVFrame *tmp; |
|
int err; |
|
|
|
tmp = av_frame_alloc(); |
|
if (!tmp) |
|
return AVERROR(ENOMEM); |
|
|
|
tmp->format = AV_PIX_FMT_DRM_PRIME; |
|
|
|
err = av_hwframe_map(tmp, src, flags); |
|
if (err < 0) |
|
goto fail; |
|
|
|
err = opencl_map_from_drm_beignet(dst_fc, dst, tmp, flags); |
|
if (err < 0) |
|
goto fail; |
|
|
|
err = ff_hwframe_map_replace(dst, src); |
|
|
|
fail: |
|
av_frame_free(&tmp); |
|
return err; |
|
} |
|
|
|
#endif /* HAVE_OPENCL_VAAPI_BEIGNET */ |
|
#endif /* HAVE_OPENCL_DRM_BEIGNET */ |
|
|
|
static inline cl_mem_flags opencl_mem_flags_for_mapping(int map_flags) |
|
{ |
|
if ((map_flags & AV_HWFRAME_MAP_READ) && |
|
(map_flags & AV_HWFRAME_MAP_WRITE)) |
|
return CL_MEM_READ_WRITE; |
|
else if (map_flags & AV_HWFRAME_MAP_READ) |
|
return CL_MEM_READ_ONLY; |
|
else if (map_flags & AV_HWFRAME_MAP_WRITE) |
|
return CL_MEM_WRITE_ONLY; |
|
else |
|
return 0; |
|
} |
|
|
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
|
|
static void opencl_unmap_from_qsv(AVHWFramesContext *dst_fc, |
|
HWMapDescriptor *hwmap) |
|
{ |
|
AVOpenCLFrameDescriptor *desc = hwmap->priv; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
|
cl_event event; |
|
cl_int cle; |
|
int p; |
|
|
|
av_log(dst_fc, AV_LOG_DEBUG, "Unmap QSV/VAAPI surface from OpenCL.\n"); |
|
|
|
cle = device_priv->clEnqueueReleaseVA_APIMediaSurfacesINTEL( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to release surface " |
|
"handles: %d.\n", cle); |
|
} |
|
|
|
opencl_wait_events(dst_fc, &event, 1); |
|
|
|
for (p = 0; p < desc->nb_planes; p++) { |
|
cle = clReleaseMemObject(desc->planes[p]); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to release CL " |
|
"image of plane %d of QSV/VAAPI surface: %d\n", |
|
p, cle); |
|
} |
|
} |
|
|
|
av_free(desc); |
|
} |
|
|
|
static int opencl_map_from_qsv(AVHWFramesContext *dst_fc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
AVHWFramesContext *src_fc = |
|
(AVHWFramesContext*)src->hw_frames_ctx->data; |
|
AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
|
AVOpenCLFrameDescriptor *desc; |
|
VASurfaceID va_surface; |
|
cl_mem_flags cl_flags; |
|
cl_event event; |
|
cl_int cle; |
|
int err, p; |
|
|
|
#if CONFIG_LIBMFX |
|
if (src->format == AV_PIX_FMT_QSV) { |
|
void *base_handle; |
|
mfxFrameSurface1 *mfx_surface = (mfxFrameSurface1*)src->data[3]; |
|
err = ff_qsv_get_surface_base_handle(mfx_surface, |
|
AV_HWDEVICE_TYPE_VAAPI, |
|
&base_handle); |
|
if (err < 0) |
|
return err; |
|
va_surface = *(VASurfaceID *)base_handle; |
|
} else |
|
#endif |
|
if (src->format == AV_PIX_FMT_VAAPI) { |
|
va_surface = (VASurfaceID)(uintptr_t)src->data[3]; |
|
} else { |
|
return AVERROR(ENOSYS); |
|
} |
|
|
|
cl_flags = opencl_mem_flags_for_mapping(flags); |
|
if (!cl_flags) |
|
return AVERROR(EINVAL); |
|
|
|
av_log(src_fc, AV_LOG_DEBUG, "Map QSV/VAAPI surface %#x to " |
|
"OpenCL.\n", va_surface); |
|
|
|
desc = av_mallocz(sizeof(*desc)); |
|
if (!desc) |
|
return AVERROR(ENOMEM); |
|
|
|
// The cl_intel_va_api_media_sharing extension only supports NV12 |
|
// surfaces, so for now there are always exactly two planes. |
|
desc->nb_planes = 2; |
|
|
|
for (p = 0; p < desc->nb_planes; p++) { |
|
desc->planes[p] = |
|
device_priv->clCreateFromVA_APIMediaSurfaceINTEL( |
|
dst_dev->context, cl_flags, &va_surface, p, &cle); |
|
if (!desc->planes[p]) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL " |
|
"image from plane %d of QSV/VAAPI surface " |
|
"%#x: %d.\n", p, va_surface, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
|
|
dst->data[p] = (uint8_t*)desc->planes[p]; |
|
} |
|
|
|
cle = device_priv->clEnqueueAcquireVA_APIMediaSurfacesINTEL( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to acquire surface " |
|
"handles: %d.\n", cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
|
|
err = opencl_wait_events(dst_fc, &event, 1); |
|
if (err < 0) |
|
goto fail; |
|
|
|
err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
|
&opencl_unmap_from_qsv, desc); |
|
if (err < 0) |
|
goto fail; |
|
|
|
dst->width = src->width; |
|
dst->height = src->height; |
|
|
|
return 0; |
|
|
|
fail: |
|
for (p = 0; p < desc->nb_planes; p++) |
|
if (desc->planes[p]) |
|
clReleaseMemObject(desc->planes[p]); |
|
av_freep(&desc); |
|
return err; |
|
} |
|
|
|
#endif |
|
|
|
#if HAVE_OPENCL_DXVA2 |
|
|
|
static void opencl_unmap_from_dxva2(AVHWFramesContext *dst_fc, |
|
HWMapDescriptor *hwmap) |
|
{ |
|
AVOpenCLFrameDescriptor *desc = hwmap->priv; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->device_ctx->internal->priv; |
|
cl_event event; |
|
cl_int cle; |
|
|
|
av_log(dst_fc, AV_LOG_DEBUG, "Unmap DXVA2 surface from OpenCL.\n"); |
|
|
|
cle = device_priv->clEnqueueReleaseDX9MediaSurfacesKHR( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to release surface " |
|
"handle: %d.\n", cle); |
|
return; |
|
} |
|
|
|
opencl_wait_events(dst_fc, &event, 1); |
|
} |
|
|
|
static int opencl_map_from_dxva2(AVHWFramesContext *dst_fc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
AVHWFramesContext *src_fc = |
|
(AVHWFramesContext*)src->hw_frames_ctx->data; |
|
AVDXVA2FramesContext *src_hwctx = src_fc->hwctx; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
|
AVOpenCLFrameDescriptor *desc; |
|
cl_event event; |
|
cl_int cle; |
|
int err, i; |
|
|
|
av_log(dst_fc, AV_LOG_DEBUG, "Map DXVA2 surface %p to " |
|
"OpenCL.\n", src->data[3]); |
|
|
|
for (i = 0; i < src_hwctx->nb_surfaces; i++) { |
|
if (src_hwctx->surfaces[i] == (IDirect3DSurface9*)src->data[3]) |
|
break; |
|
} |
|
if (i >= src_hwctx->nb_surfaces) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Trying to map from a surface which " |
|
"is not in the mapped frames context.\n"); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
desc = &frames_priv->mapped_frames[i]; |
|
|
|
cle = device_priv->clEnqueueAcquireDX9MediaSurfacesKHR( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to acquire surface " |
|
"handle: %d.\n", cle); |
|
return AVERROR(EIO); |
|
} |
|
|
|
err = opencl_wait_events(dst_fc, &event, 1); |
|
if (err < 0) |
|
goto fail; |
|
|
|
for (i = 0; i < desc->nb_planes; i++) |
|
dst->data[i] = (uint8_t*)desc->planes[i]; |
|
|
|
err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
|
&opencl_unmap_from_dxva2, desc); |
|
if (err < 0) |
|
goto fail; |
|
|
|
dst->width = src->width; |
|
dst->height = src->height; |
|
|
|
return 0; |
|
|
|
fail: |
|
cle = device_priv->clEnqueueReleaseDX9MediaSurfacesKHR( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle == CL_SUCCESS) |
|
opencl_wait_events(dst_fc, &event, 1); |
|
return err; |
|
} |
|
|
|
static int opencl_frames_derive_from_dxva2(AVHWFramesContext *dst_fc, |
|
AVHWFramesContext *src_fc, int flags) |
|
{ |
|
AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
|
AVDXVA2FramesContext *src_hwctx = src_fc->hwctx; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
|
cl_mem_flags cl_flags; |
|
cl_int cle; |
|
int err, i, p, nb_planes; |
|
|
|
if (src_fc->sw_format != AV_PIX_FMT_NV12) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Only NV12 textures are supported " |
|
"for DXVA2 to OpenCL mapping.\n"); |
|
return AVERROR(EINVAL); |
|
} |
|
nb_planes = 2; |
|
|
|
if (src_fc->initial_pool_size == 0) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Only fixed-size pools are supported " |
|
"for DXVA2 to OpenCL mapping.\n"); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
cl_flags = opencl_mem_flags_for_mapping(flags); |
|
if (!cl_flags) |
|
return AVERROR(EINVAL); |
|
|
|
frames_priv->nb_mapped_frames = src_hwctx->nb_surfaces; |
|
|
|
frames_priv->mapped_frames = |
|
av_calloc(frames_priv->nb_mapped_frames, |
|
sizeof(*frames_priv->mapped_frames)); |
|
if (!frames_priv->mapped_frames) |
|
return AVERROR(ENOMEM); |
|
|
|
for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
|
AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
|
cl_dx9_surface_info_khr surface_info = { |
|
.resource = src_hwctx->surfaces[i], |
|
.shared_handle = NULL, |
|
}; |
|
desc->nb_planes = nb_planes; |
|
for (p = 0; p < nb_planes; p++) { |
|
desc->planes[p] = |
|
device_priv->clCreateFromDX9MediaSurfaceKHR( |
|
dst_dev->context, cl_flags, |
|
device_priv->dx9_media_adapter_type, |
|
&surface_info, p, &cle); |
|
if (!desc->planes[p]) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL " |
|
"image from plane %d of DXVA2 surface %d: %d.\n", |
|
p, i, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
} |
|
} |
|
|
|
return 0; |
|
|
|
fail: |
|
for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
|
AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
|
for (p = 0; p < desc->nb_planes; p++) { |
|
if (desc->planes[p]) |
|
clReleaseMemObject(desc->planes[p]); |
|
} |
|
} |
|
av_freep(&frames_priv->mapped_frames); |
|
frames_priv->nb_mapped_frames = 0; |
|
return err; |
|
} |
|
|
|
#endif |
|
|
|
#if HAVE_OPENCL_D3D11 |
|
|
|
static void opencl_unmap_from_d3d11(AVHWFramesContext *dst_fc, |
|
HWMapDescriptor *hwmap) |
|
{ |
|
AVOpenCLFrameDescriptor *desc = hwmap->priv; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->device_ctx->internal->priv; |
|
cl_event event; |
|
cl_int cle; |
|
|
|
cle = device_priv->clEnqueueReleaseD3D11ObjectsKHR( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to release surface " |
|
"handle: %d.\n", cle); |
|
} |
|
|
|
opencl_wait_events(dst_fc, &event, 1); |
|
} |
|
|
|
static int opencl_map_from_d3d11(AVHWFramesContext *dst_fc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
|
AVOpenCLFrameDescriptor *desc; |
|
cl_event event; |
|
cl_int cle; |
|
int err, index, i; |
|
|
|
index = (intptr_t)src->data[1]; |
|
if (index >= frames_priv->nb_mapped_frames) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Texture array index out of range for " |
|
"mapping: %d >= %d.\n", index, frames_priv->nb_mapped_frames); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
av_log(dst_fc, AV_LOG_DEBUG, "Map D3D11 texture %d to OpenCL.\n", |
|
index); |
|
|
|
desc = &frames_priv->mapped_frames[index]; |
|
|
|
cle = device_priv->clEnqueueAcquireD3D11ObjectsKHR( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle != CL_SUCCESS) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to acquire surface " |
|
"handle: %d.\n", cle); |
|
return AVERROR(EIO); |
|
} |
|
|
|
err = opencl_wait_events(dst_fc, &event, 1); |
|
if (err < 0) |
|
goto fail; |
|
|
|
for (i = 0; i < desc->nb_planes; i++) |
|
dst->data[i] = (uint8_t*)desc->planes[i]; |
|
|
|
err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
|
&opencl_unmap_from_d3d11, desc); |
|
if (err < 0) |
|
goto fail; |
|
|
|
dst->width = src->width; |
|
dst->height = src->height; |
|
|
|
return 0; |
|
|
|
fail: |
|
cle = device_priv->clEnqueueReleaseD3D11ObjectsKHR( |
|
frames_priv->command_queue, desc->nb_planes, desc->planes, |
|
0, NULL, &event); |
|
if (cle == CL_SUCCESS) |
|
opencl_wait_events(dst_fc, &event, 1); |
|
return err; |
|
} |
|
|
|
static int opencl_frames_derive_from_d3d11(AVHWFramesContext *dst_fc, |
|
AVHWFramesContext *src_fc, int flags) |
|
{ |
|
AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
|
AVD3D11VAFramesContext *src_hwctx = src_fc->hwctx; |
|
OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
|
OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
|
cl_mem_flags cl_flags; |
|
cl_int cle; |
|
int err, i, p, nb_planes; |
|
|
|
if (src_fc->sw_format != AV_PIX_FMT_NV12) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Only NV12 textures are supported " |
|
"for D3D11 to OpenCL mapping.\n"); |
|
return AVERROR(EINVAL); |
|
} |
|
nb_planes = 2; |
|
|
|
if (src_fc->initial_pool_size == 0) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Only fixed-size pools are supported " |
|
"for D3D11 to OpenCL mapping.\n"); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
cl_flags = opencl_mem_flags_for_mapping(flags); |
|
if (!cl_flags) |
|
return AVERROR(EINVAL); |
|
|
|
frames_priv->nb_mapped_frames = src_fc->initial_pool_size; |
|
|
|
frames_priv->mapped_frames = |
|
av_calloc(frames_priv->nb_mapped_frames, |
|
sizeof(*frames_priv->mapped_frames)); |
|
if (!frames_priv->mapped_frames) |
|
return AVERROR(ENOMEM); |
|
|
|
for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
|
AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
|
desc->nb_planes = nb_planes; |
|
for (p = 0; p < nb_planes; p++) { |
|
UINT subresource = 2 * i + p; |
|
|
|
desc->planes[p] = |
|
device_priv->clCreateFromD3D11Texture2DKHR( |
|
dst_dev->context, cl_flags, src_hwctx->texture, |
|
subresource, &cle); |
|
if (!desc->planes[p]) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL " |
|
"image from plane %d of D3D texture " |
|
"index %d (subresource %u): %d.\n", |
|
p, i, (unsigned int)subresource, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
} |
|
} |
|
|
|
return 0; |
|
|
|
fail: |
|
for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
|
AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
|
for (p = 0; p < desc->nb_planes; p++) { |
|
if (desc->planes[p]) |
|
clReleaseMemObject(desc->planes[p]); |
|
} |
|
} |
|
av_freep(&frames_priv->mapped_frames); |
|
frames_priv->nb_mapped_frames = 0; |
|
return err; |
|
} |
|
|
|
#endif |
|
|
|
#if HAVE_OPENCL_DRM_ARM |
|
|
|
typedef struct DRMARMtoOpenCLMapping { |
|
int nb_objects; |
|
cl_mem object_buffers[AV_DRM_MAX_PLANES]; |
|
int nb_planes; |
|
cl_mem plane_images[AV_DRM_MAX_PLANES]; |
|
} DRMARMtoOpenCLMapping; |
|
|
|
static void opencl_unmap_from_drm_arm(AVHWFramesContext *dst_fc, |
|
HWMapDescriptor *hwmap) |
|
{ |
|
DRMARMtoOpenCLMapping *mapping = hwmap->priv; |
|
int i; |
|
|
|
for (i = 0; i < mapping->nb_planes; i++) |
|
clReleaseMemObject(mapping->plane_images[i]); |
|
|
|
for (i = 0; i < mapping->nb_objects; i++) |
|
clReleaseMemObject(mapping->object_buffers[i]); |
|
|
|
av_free(mapping); |
|
} |
|
|
|
static int opencl_map_from_drm_arm(AVHWFramesContext *dst_fc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
AVHWFramesContext *src_fc = |
|
(AVHWFramesContext*)src->hw_frames_ctx->data; |
|
AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
|
const AVDRMFrameDescriptor *desc; |
|
DRMARMtoOpenCLMapping *mapping = NULL; |
|
cl_mem_flags cl_flags; |
|
const cl_import_properties_arm props[3] = { |
|
CL_IMPORT_TYPE_ARM, CL_IMPORT_TYPE_DMA_BUF_ARM, 0, |
|
}; |
|
cl_int cle; |
|
int err, i, j; |
|
|
|
desc = (const AVDRMFrameDescriptor*)src->data[0]; |
|
|
|
cl_flags = opencl_mem_flags_for_mapping(flags); |
|
if (!cl_flags) |
|
return AVERROR(EINVAL); |
|
|
|
mapping = av_mallocz(sizeof(*mapping)); |
|
if (!mapping) |
|
return AVERROR(ENOMEM); |
|
|
|
mapping->nb_objects = desc->nb_objects; |
|
for (i = 0; i < desc->nb_objects; i++) { |
|
int fd = desc->objects[i].fd; |
|
|
|
av_log(dst_fc, AV_LOG_DEBUG, "Map DRM PRIME fd %d to OpenCL.\n", fd); |
|
|
|
if (desc->objects[i].format_modifier) { |
|
av_log(dst_fc, AV_LOG_DEBUG, "Warning: object %d fd %d has " |
|
"nonzero format modifier %"PRId64", result may not " |
|
"be as expected.\n", i, fd, |
|
desc->objects[i].format_modifier); |
|
} |
|
|
|
mapping->object_buffers[i] = |
|
clImportMemoryARM(dst_dev->context, cl_flags, props, |
|
&fd, desc->objects[i].size, &cle); |
|
if (!mapping->object_buffers[i]) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL buffer " |
|
"from object %d (fd %d, size %"SIZE_SPECIFIER") of DRM frame: %d.\n", |
|
i, fd, desc->objects[i].size, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
} |
|
|
|
mapping->nb_planes = 0; |
|
for (i = 0; i < desc->nb_layers; i++) { |
|
const AVDRMLayerDescriptor *layer = &desc->layers[i]; |
|
|
|
for (j = 0; j < layer->nb_planes; j++) { |
|
const AVDRMPlaneDescriptor *plane = &layer->planes[j]; |
|
cl_mem plane_buffer; |
|
cl_image_format image_format; |
|
cl_image_desc image_desc; |
|
cl_buffer_region region; |
|
int p = mapping->nb_planes; |
|
|
|
err = opencl_get_plane_format(src_fc->sw_format, p, |
|
src_fc->width, src_fc->height, |
|
&image_format, &image_desc); |
|
if (err < 0) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Invalid plane %d (DRM " |
|
"layer %d plane %d): %d.\n", p, i, j, err); |
|
goto fail; |
|
} |
|
|
|
region.origin = plane->offset; |
|
region.size = image_desc.image_row_pitch * |
|
image_desc.image_height; |
|
|
|
plane_buffer = |
|
clCreateSubBuffer(mapping->object_buffers[plane->object_index], |
|
cl_flags, |
|
CL_BUFFER_CREATE_TYPE_REGION, |
|
®ion, &cle); |
|
if (!plane_buffer) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create sub-buffer " |
|
"for plane %d: %d.\n", p, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
|
|
image_desc.buffer = plane_buffer; |
|
|
|
mapping->plane_images[p] = |
|
clCreateImage(dst_dev->context, cl_flags, |
|
&image_format, &image_desc, NULL, &cle); |
|
|
|
// Unreference the sub-buffer immediately - we don't need it |
|
// directly and a reference is held by the image. |
|
clReleaseMemObject(plane_buffer); |
|
|
|
if (!mapping->plane_images[p]) { |
|
av_log(dst_fc, AV_LOG_ERROR, "Failed to create image " |
|
"for plane %d: %d.\n", p, cle); |
|
err = AVERROR(EIO); |
|
goto fail; |
|
} |
|
|
|
++mapping->nb_planes; |
|
} |
|
} |
|
|
|
for (i = 0; i < mapping->nb_planes; i++) |
|
dst->data[i] = (uint8_t*)mapping->plane_images[i]; |
|
|
|
err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
|
&opencl_unmap_from_drm_arm, mapping); |
|
if (err < 0) |
|
goto fail; |
|
|
|
dst->width = src->width; |
|
dst->height = src->height; |
|
|
|
return 0; |
|
|
|
fail: |
|
for (i = 0; i < mapping->nb_planes; i++) { |
|
clReleaseMemObject(mapping->plane_images[i]); |
|
} |
|
for (i = 0; i < mapping->nb_objects; i++) { |
|
if (mapping->object_buffers[i]) |
|
clReleaseMemObject(mapping->object_buffers[i]); |
|
} |
|
av_free(mapping); |
|
return err; |
|
} |
|
|
|
#endif |
|
|
|
static int opencl_map_from(AVHWFramesContext *hwfc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
av_assert0(src->format == AV_PIX_FMT_OPENCL); |
|
if (hwfc->sw_format != dst->format) |
|
return AVERROR(ENOSYS); |
|
return opencl_map_frame(hwfc, dst, src, flags); |
|
} |
|
|
|
static int opencl_map_to(AVHWFramesContext *hwfc, AVFrame *dst, |
|
const AVFrame *src, int flags) |
|
{ |
|
av_unused OpenCLDeviceContext *priv = hwfc->device_ctx->internal->priv; |
|
av_assert0(dst->format == AV_PIX_FMT_OPENCL); |
|
switch (src->format) { |
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
case AV_PIX_FMT_DRM_PRIME: |
|
if (priv->beignet_drm_mapping_usable) |
|
return opencl_map_from_drm_beignet(hwfc, dst, src, flags); |
|
#endif |
|
#if HAVE_OPENCL_VAAPI_BEIGNET |
|
case AV_PIX_FMT_VAAPI: |
|
if (priv->beignet_drm_mapping_usable) |
|
return opencl_map_from_vaapi(hwfc, dst, src, flags); |
|
#endif |
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
case AV_PIX_FMT_QSV: |
|
case AV_PIX_FMT_VAAPI: |
|
if (priv->qsv_mapping_usable) |
|
return opencl_map_from_qsv(hwfc, dst, src, flags); |
|
#endif |
|
#if HAVE_OPENCL_DXVA2 |
|
case AV_PIX_FMT_DXVA2_VLD: |
|
if (priv->dxva2_mapping_usable) |
|
return opencl_map_from_dxva2(hwfc, dst, src, flags); |
|
#endif |
|
#if HAVE_OPENCL_D3D11 |
|
case AV_PIX_FMT_D3D11: |
|
if (priv->d3d11_mapping_usable) |
|
return opencl_map_from_d3d11(hwfc, dst, src, flags); |
|
#endif |
|
#if HAVE_OPENCL_DRM_ARM |
|
case AV_PIX_FMT_DRM_PRIME: |
|
if (priv->drm_arm_mapping_usable) |
|
return opencl_map_from_drm_arm(hwfc, dst, src, flags); |
|
#endif |
|
} |
|
return AVERROR(ENOSYS); |
|
} |
|
|
|
static int opencl_frames_derive_to(AVHWFramesContext *dst_fc, |
|
AVHWFramesContext *src_fc, int flags) |
|
{ |
|
av_unused OpenCLDeviceContext *priv = dst_fc->device_ctx->internal->priv; |
|
switch (src_fc->device_ctx->type) { |
|
#if HAVE_OPENCL_DRM_BEIGNET |
|
case AV_HWDEVICE_TYPE_DRM: |
|
if (!priv->beignet_drm_mapping_usable) |
|
return AVERROR(ENOSYS); |
|
break; |
|
#endif |
|
#if HAVE_OPENCL_VAAPI_BEIGNET |
|
case AV_HWDEVICE_TYPE_VAAPI: |
|
if (!priv->beignet_drm_mapping_usable) |
|
return AVERROR(ENOSYS); |
|
break; |
|
#endif |
|
#if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
|
case AV_HWDEVICE_TYPE_QSV: |
|
case AV_HWDEVICE_TYPE_VAAPI: |
|
if (!priv->qsv_mapping_usable) |
|
return AVERROR(ENOSYS); |
|
break; |
|
#endif |
|
#if HAVE_OPENCL_DXVA2 |
|
case AV_HWDEVICE_TYPE_DXVA2: |
|
if (!priv->dxva2_mapping_usable) |
|
return AVERROR(ENOSYS); |
|
{ |
|
int err; |
|
err = opencl_frames_derive_from_dxva2(dst_fc, src_fc, flags); |
|
if (err < 0) |
|
return err; |
|
} |
|
break; |
|
#endif |
|
#if HAVE_OPENCL_D3D11 |
|
case AV_HWDEVICE_TYPE_D3D11VA: |
|
if (!priv->d3d11_mapping_usable) |
|
return AVERROR(ENOSYS); |
|
{ |
|
int err; |
|
err = opencl_frames_derive_from_d3d11(dst_fc, src_fc, flags); |
|
if (err < 0) |
|
return err; |
|
} |
|
break; |
|
#endif |
|
#if HAVE_OPENCL_DRM_ARM |
|
case AV_HWDEVICE_TYPE_DRM: |
|
if (!priv->drm_arm_mapping_usable) |
|
return AVERROR(ENOSYS); |
|
break; |
|
#endif |
|
default: |
|
return AVERROR(ENOSYS); |
|
} |
|
return opencl_frames_init_command_queue(dst_fc); |
|
} |
|
|
|
const HWContextType ff_hwcontext_type_opencl = { |
|
.type = AV_HWDEVICE_TYPE_OPENCL, |
|
.name = "OpenCL", |
|
|
|
.device_hwctx_size = sizeof(AVOpenCLDeviceContext), |
|
.device_priv_size = sizeof(OpenCLDeviceContext), |
|
.frames_hwctx_size = sizeof(AVOpenCLFramesContext), |
|
.frames_priv_size = sizeof(OpenCLFramesContext), |
|
|
|
.device_create = &opencl_device_create, |
|
.device_derive = &opencl_device_derive, |
|
.device_init = &opencl_device_init, |
|
.device_uninit = &opencl_device_uninit, |
|
|
|
.frames_get_constraints = &opencl_frames_get_constraints, |
|
.frames_init = &opencl_frames_init, |
|
.frames_uninit = &opencl_frames_uninit, |
|
.frames_get_buffer = &opencl_get_buffer, |
|
|
|
.transfer_get_formats = &opencl_transfer_get_formats, |
|
.transfer_data_to = &opencl_transfer_data_to, |
|
.transfer_data_from = &opencl_transfer_data_from, |
|
|
|
.map_from = &opencl_map_from, |
|
.map_to = &opencl_map_to, |
|
.frames_derive_to = &opencl_frames_derive_to, |
|
|
|
.pix_fmts = (const enum AVPixelFormat[]) { |
|
AV_PIX_FMT_OPENCL, |
|
AV_PIX_FMT_NONE |
|
}, |
|
};
|
|
|