mirror of https://github.com/FFmpeg/FFmpeg.git
347 lines
9.9 KiB
347 lines
9.9 KiB
/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
#include <stdio.h> |
|
#include <string.h> |
|
|
|
#include "libavutil/file_open.h" |
|
#include "libavutil/mem.h" |
|
#include "libavutil/pixdesc.h" |
|
|
|
#include "opencl.h" |
|
|
|
static int opencl_filter_set_device(AVFilterContext *avctx, |
|
AVBufferRef *device) |
|
{ |
|
OpenCLFilterContext *ctx = avctx->priv; |
|
|
|
av_buffer_unref(&ctx->device_ref); |
|
|
|
ctx->device_ref = av_buffer_ref(device); |
|
if (!ctx->device_ref) |
|
return AVERROR(ENOMEM); |
|
|
|
ctx->device = (AVHWDeviceContext*)ctx->device_ref->data; |
|
ctx->hwctx = ctx->device->hwctx; |
|
|
|
return 0; |
|
} |
|
|
|
/**
 * Configure an input link of an OpenCL filter.
 *
 * Every input must carry a hardware frames context.  Only the first input
 * of the filter is examined further: its frames must be in OpenCL format,
 * its device is adopted by the filter, and its software format and link
 * dimensions are used for any output parameter that is still unset.
 *
 * @param inlink input link being configured
 * @return 0 on success, a negative AVERROR code on failure
 */
int ff_opencl_filter_config_input(AVFilterLink *inlink)
{
    AVFilterContext     *avctx = inlink->dst;
    OpenCLFilterContext *priv  = avctx->priv;
    AVHWFramesContext   *in_frames;
    int ret;

    if (!inlink->hw_frames_ctx) {
        av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires a "
               "hardware frames context on the input.\n");
        return AVERROR(EINVAL);
    }

    // Secondary inputs contribute nothing beyond the check above.
    if (inlink != avctx->inputs[0])
        return 0;

    in_frames = (AVHWFramesContext*)inlink->hw_frames_ctx->data;
    if (in_frames->format != AV_PIX_FMT_OPENCL)
        return AVERROR(EINVAL);

    ret = opencl_filter_set_device(avctx, in_frames->device_ref);
    if (ret < 0)
        return ret;

    // Anything the filter has not chosen explicitly is inherited from
    // the first input.
    if (priv->output_format == AV_PIX_FMT_NONE)
        priv->output_format = in_frames->sw_format;
    if (priv->output_width == 0)
        priv->output_width = inlink->w;
    if (priv->output_height == 0)
        priv->output_height = inlink->h;

    return 0;
}
|
|
|
/**
 * Configure the output link of an OpenCL filter.
 *
 * Releases any frames context already attached to the link, makes sure
 * the filter has a device (falling back to avctx->hw_device_ctx when none
 * has been set yet), then allocates and initialises an OpenCL frames
 * context using the output format and dimensions stored in the filter's
 * private context.  On success the new frames context and the output
 * dimensions are installed on the link.
 *
 * @param outlink output link being configured
 * @return 0 on success, a negative AVERROR code on failure
 */
int ff_opencl_filter_config_output(AVFilterLink *outlink)
{
    AVFilterContext     *avctx = outlink->src;
    OpenCLFilterContext *priv  = avctx->priv;
    AVBufferRef         *frames_ref;
    AVHWFramesContext   *frames;
    int ret;

    av_buffer_unref(&outlink->hw_frames_ctx);

    if (!priv->device_ref) {
        // No device yet: the filter-level device is the only remaining
        // source.
        if (!avctx->hw_device_ctx) {
            av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires an "
                   "OpenCL device.\n");
            return AVERROR(EINVAL);
        }

        ret = opencl_filter_set_device(avctx, avctx->hw_device_ctx);
        if (ret < 0)
            return ret;
    }

    frames_ref = av_hwframe_ctx_alloc(priv->device_ref);
    if (!frames_ref)
        return AVERROR(ENOMEM);

    frames            = (AVHWFramesContext*)frames_ref->data;
    frames->format    = AV_PIX_FMT_OPENCL;
    frames->sw_format = priv->output_format;
    frames->width     = priv->output_width;
    frames->height    = priv->output_height;

    ret = av_hwframe_ctx_init(frames_ref);
    if (ret < 0) {
        av_log(avctx, AV_LOG_ERROR, "Failed to initialise output "
               "frames: %d.\n", ret);
        av_buffer_unref(&frames_ref);
        return ret;
    }

    // The link takes over the reference allocated above.
    outlink->hw_frames_ctx = frames_ref;
    outlink->w             = priv->output_width;
    outlink->h             = priv->output_height;

    return 0;
}
|
|
|
/**
 * Common initialisation for OpenCL filters.
 *
 * Marks the output pixel format as unset (AV_PIX_FMT_NONE).
 *
 * @param avctx filter whose private data is an OpenCLFilterContext
 * @return always 0
 */
int ff_opencl_filter_init(AVFilterContext *avctx)
{
    OpenCLFilterContext *priv = avctx->priv;

    priv->output_format = AV_PIX_FMT_NONE;
    return 0;
}
|
|
|
/**
 * Common teardown for OpenCL filters.
 *
 * Releases the OpenCL program if one is set (a release failure is logged
 * but otherwise ignored) and drops the filter's device reference.
 *
 * @param avctx filter whose private data is an OpenCLFilterContext
 */
void ff_opencl_filter_uninit(AVFilterContext *avctx)
{
    OpenCLFilterContext *priv = avctx->priv;

    if (priv->program) {
        cl_int status = clReleaseProgram(priv->program);

        if (status != CL_SUCCESS)
            av_log(avctx, AV_LOG_ERROR, "Failed to release "
                   "program: %d.\n", status);
    }

    av_buffer_unref(&priv->device_ref);
}
|
|
|
/**
 * Create and build the filter's OpenCL program from source strings.
 *
 * The program is created in the context of the filter's device and built
 * for that single device.  If the build fails with
 * CL_BUILD_PROGRAM_FAILURE the compiler's build log is fetched and logged
 * when it can be retrieved.  After a build failure the program is released
 * and ctx->program is reset to NULL.
 *
 * @param avctx                filter whose private data is an
 *                             OpenCLFilterContext with hwctx already set
 * @param program_source_array array of source strings passed to
 *                             clCreateProgramWithSource()
 * @param nb_strings           number of entries in program_source_array
 * @return 0 on success, AVERROR(EIO) if the program cannot be created or
 *         built
 */
int ff_opencl_filter_load_program(AVFilterContext *avctx,
                                  const char **program_source_array,
                                  int nb_strings)
{
    OpenCLFilterContext *ctx = avctx->priv;
    cl_int cle;

    ctx->program = clCreateProgramWithSource(ctx->hwctx->context, nb_strings,
                                             program_source_array,
                                             NULL, &cle);
    if (!ctx->program) {
        av_log(avctx, AV_LOG_ERROR, "Failed to create program: %d.\n", cle);
        return AVERROR(EIO);
    }

    cle = clBuildProgram(ctx->program, 1, &ctx->hwctx->device_id,
                         NULL, NULL, NULL);
    if (cle != CL_SUCCESS) {
        av_log(avctx, AV_LOG_ERROR, "Failed to build program: %d.\n", cle);

        if (cle == CL_BUILD_PROGRAM_FAILURE) {
            char *log = NULL;
            size_t log_length = 0;

            // Ask for the log size first.  If the query fails the length
            // is not meaningful, so do not allocate or print anything.
            cle = clGetProgramBuildInfo(ctx->program, ctx->hwctx->device_id,
                                        CL_PROGRAM_BUILD_LOG, 0, NULL,
                                        &log_length);
            if (cle == CL_SUCCESS && log_length > 0)
                log = av_malloc(log_length);

            if (log) {
                cle = clGetProgramBuildInfo(ctx->program,
                                            ctx->hwctx->device_id,
                                            CL_PROGRAM_BUILD_LOG,
                                            log_length, log, NULL);
                if (cle == CL_SUCCESS)
                    av_log(avctx, AV_LOG_ERROR, "Build log:\n%s\n", log);
            }

            av_free(log);
        }

        clReleaseProgram(ctx->program);
        ctx->program = NULL;
        return AVERROR(EIO);
    }

    return 0;
}
|
|
|
/**
 * Load the filter's OpenCL program from a source file.
 *
 * The file is read completely into a growable buffer that starts with a
 * `#line 1 "<filename>"` directive, and the resulting string is handed to
 * ff_opencl_filter_load_program().
 *
 * @param avctx    filter to load the program into
 * @param filename path of the program source file
 * @return 0 on success; AVERROR(ENOENT) if the file cannot be opened,
 *         AVERROR(EIO) on a read error, AVERROR(EINVAL) if the #line
 *         prefix would take more than half of the initial buffer, or any
 *         error returned by allocation or by
 *         ff_opencl_filter_load_program()
 */
int ff_opencl_filter_load_program_from_file(AVFilterContext *avctx,
                                            const char *filename)
{
    FILE *file;
    char *src = NULL;
    size_t pos, len, rb;
    const char *src_const;
    int err;

    file = avpriv_fopen_utf8(filename, "r");
    if (!file) {
        av_log(avctx, AV_LOG_ERROR, "Unable to open program "
               "source file \"%s\".\n", filename);
        return AVERROR(ENOENT);
    }

    len = 1 << 16;
    pos = 0;

    err = av_reallocp(&src, len);
    if (err < 0)
        goto fail;

    err = snprintf(src, len, "#line 1 \"%s\"\n", filename);
    if (err < 0) {
        err = AVERROR(errno);
        goto fail;
    }
    // err is non-negative here, so the conversion to size_t is safe; the
    // limit also guarantees the prefix was not truncated by snprintf().
    if ((size_t)err > len / 2) {
        err = AVERROR(EINVAL);
        goto fail;
    }
    pos = err;

    while (1) {
        // Always leave one byte free for the terminating NUL.
        rb = fread(src + pos, 1, len - pos - 1, file);
        // A short read can be caused by an error as well as by EOF, so
        // check the stream's error flag even when some bytes were read;
        // otherwise a truncated program would be compiled silently.
        if (ferror(file)) {
            err = AVERROR(EIO);
            goto fail;
        }
        pos += rb;
        // The buffer was not filled: end of file reached.
        if (pos + 1 < len)
            break;
        len <<= 1;
        err = av_reallocp(&src, len);
        if (err < 0)
            goto fail;
    }
    src[pos] = 0;

    src_const = src;

    err = ff_opencl_filter_load_program(avctx, &src_const, 1);
fail:
    fclose(file);
    av_freep(&src);
    return err;
}
|
|
|
int ff_opencl_filter_work_size_from_image(AVFilterContext *avctx, |
|
size_t *work_size, |
|
AVFrame *frame, int plane, |
|
int block_alignment) |
|
{ |
|
cl_mem image; |
|
cl_mem_object_type type; |
|
size_t width, height; |
|
cl_int cle; |
|
|
|
if (frame->format != AV_PIX_FMT_OPENCL) { |
|
av_log(avctx, AV_LOG_ERROR, "Invalid frame format %s, " |
|
"opencl required.\n", av_get_pix_fmt_name(frame->format)); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
image = (cl_mem)frame->data[plane]; |
|
if (!image) { |
|
av_log(avctx, AV_LOG_ERROR, "Plane %d required but not set.\n", |
|
plane); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
cle = clGetMemObjectInfo(image, CL_MEM_TYPE, sizeof(type), |
|
&type, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(avctx, AV_LOG_ERROR, "Failed to query object type of " |
|
"plane %d: %d.\n", plane, cle); |
|
return AVERROR_UNKNOWN; |
|
} |
|
if (type != CL_MEM_OBJECT_IMAGE2D) { |
|
av_log(avctx, AV_LOG_ERROR, "Plane %d is not a 2D image.\n", |
|
plane); |
|
return AVERROR(EINVAL); |
|
} |
|
|
|
cle = clGetImageInfo(image, CL_IMAGE_WIDTH, sizeof(size_t), |
|
&width, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(avctx, AV_LOG_ERROR, "Failed to query plane %d width: %d.\n", |
|
plane, cle); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
cle = clGetImageInfo(image, CL_IMAGE_HEIGHT, sizeof(size_t), |
|
&height, NULL); |
|
if (cle != CL_SUCCESS) { |
|
av_log(avctx, AV_LOG_ERROR, "Failed to query plane %d height: %d.\n", |
|
plane, cle); |
|
return AVERROR_UNKNOWN; |
|
} |
|
|
|
if (block_alignment) { |
|
width = FFALIGN(width, block_alignment); |
|
height = FFALIGN(height, block_alignment); |
|
} |
|
|
|
work_size[0] = width; |
|
work_size[1] = height; |
|
|
|
return 0; |
|
} |
|
|
|
/**
 * Append a 3x3 matrix to a print buffer as an OpenCL C
 * `__constant float <name>[9]` array definition.
 *
 * Elements are written in row order with five decimal places and an `f`
 * suffix, three per line.
 *
 * @param buf      print buffer to append to
 * @param name_str identifier used for the emitted array
 * @param mat      matrix to print
 */
void ff_opencl_print_const_matrix_3x3(AVBPrint *buf, const char *name_str,
                                      double mat[3][3])
{
    int idx;

    av_bprintf(buf, "__constant float %s[9] = {\n", name_str);
    for (idx = 0; idx < 9; idx++) {
        av_bprintf(buf, " %.5ff,", mat[idx / 3][idx % 3]);
        // End the line once a row of three values is complete.
        if (idx % 3 == 2)
            av_bprintf(buf, "\n");
    }
    av_bprintf(buf, "};\n");
}
|
|
|
/**
 * Return the difference between the CL_PROFILING_COMMAND_END and
 * CL_PROFILING_COMMAND_START counters of an event.
 *
 * @param event event to query
 * @return end counter minus start counter, or 0 if either profiling
 *         query fails
 */
cl_ulong ff_opencl_get_event_time(cl_event event) {
    cl_ulong time_start = 0;
    cl_ulong time_end   = 0;
    cl_int cle;

    // The queries can fail, in which case the output values are not
    // written; bail out instead of subtracting indeterminate values.
    cle = clGetEventProfilingInfo(event, CL_PROFILING_COMMAND_START,
                                  sizeof(time_start), &time_start, NULL);
    if (cle != CL_SUCCESS)
        return 0;

    cle = clGetEventProfilingInfo(event, CL_PROFILING_COMMAND_END,
                                  sizeof(time_end), &time_end, NULL);
    if (cle != CL_SUCCESS)
        return 0;

    return time_end - time_start;
}
|
|
|