ffmpeg/libavfilter/opencl.c

348 lines
9.9 KiB
C

/*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include <stdio.h>
#include <string.h>
#include "libavutil/mem.h"
#include "libavutil/pixdesc.h"
#include "formats.h"
#include "opencl.h"
static int opencl_filter_set_device(AVFilterContext *avctx,
AVBufferRef *device)
{
OpenCLFilterContext *ctx = avctx->priv;
av_buffer_unref(&ctx->device_ref);
ctx->device_ref = av_buffer_ref(device);
if (!ctx->device_ref)
return AVERROR(ENOMEM);
ctx->device = (AVHWDeviceContext*)ctx->device_ref->data;
ctx->hwctx = ctx->device->hwctx;
return 0;
}
int ff_opencl_filter_config_input(AVFilterLink *inlink)
{
AVFilterContext *avctx = inlink->dst;
OpenCLFilterContext *ctx = avctx->priv;
AVHWFramesContext *input_frames;
int err;
if (!inlink->hw_frames_ctx) {
av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires a "
"hardware frames context on the input.\n");
return AVERROR(EINVAL);
}
// Extract the device and default output format from the first input.
if (avctx->inputs[0] != inlink)
return 0;
input_frames = (AVHWFramesContext*)inlink->hw_frames_ctx->data;
if (input_frames->format != AV_PIX_FMT_OPENCL)
return AVERROR(EINVAL);
err = opencl_filter_set_device(avctx, input_frames->device_ref);
if (err < 0)
return err;
// Default output parameters match input parameters.
if (ctx->output_format == AV_PIX_FMT_NONE)
ctx->output_format = input_frames->sw_format;
if (!ctx->output_width)
ctx->output_width = inlink->w;
if (!ctx->output_height)
ctx->output_height = inlink->h;
return 0;
}
int ff_opencl_filter_config_output(AVFilterLink *outlink)
{
AVFilterContext *avctx = outlink->src;
OpenCLFilterContext *ctx = avctx->priv;
AVBufferRef *output_frames_ref = NULL;
AVHWFramesContext *output_frames;
int err;
av_buffer_unref(&outlink->hw_frames_ctx);
if (!ctx->device_ref) {
if (!avctx->hw_device_ctx) {
av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires an "
"OpenCL device.\n");
return AVERROR(EINVAL);
}
err = opencl_filter_set_device(avctx, avctx->hw_device_ctx);
if (err < 0)
return err;
}
output_frames_ref = av_hwframe_ctx_alloc(ctx->device_ref);
if (!output_frames_ref) {
err = AVERROR(ENOMEM);
goto fail;
}
output_frames = (AVHWFramesContext*)output_frames_ref->data;
output_frames->format = AV_PIX_FMT_OPENCL;
output_frames->sw_format = ctx->output_format;
output_frames->width = ctx->output_width;
output_frames->height = ctx->output_height;
err = av_hwframe_ctx_init(output_frames_ref);
if (err < 0) {
av_log(avctx, AV_LOG_ERROR, "Failed to initialise output "
"frames: %d.\n", err);
goto fail;
}
outlink->hw_frames_ctx = output_frames_ref;
outlink->w = ctx->output_width;
outlink->h = ctx->output_height;
return 0;
fail:
av_buffer_unref(&output_frames_ref);
return err;
}
int ff_opencl_filter_init(AVFilterContext *avctx)
{
OpenCLFilterContext *ctx = avctx->priv;
ctx->output_format = AV_PIX_FMT_NONE;
return 0;
}
void ff_opencl_filter_uninit(AVFilterContext *avctx)
{
OpenCLFilterContext *ctx = avctx->priv;
cl_int cle;
if (ctx->program) {
cle = clReleaseProgram(ctx->program);
if (cle != CL_SUCCESS)
av_log(avctx, AV_LOG_ERROR, "Failed to release "
"program: %d.\n", cle);
}
av_buffer_unref(&ctx->device_ref);
}
int ff_opencl_filter_load_program(AVFilterContext *avctx,
const char **program_source_array,
int nb_strings)
{
OpenCLFilterContext *ctx = avctx->priv;
cl_int cle;
ctx->program = clCreateProgramWithSource(ctx->hwctx->context, nb_strings,
program_source_array,
NULL, &cle);
if (!ctx->program) {
av_log(avctx, AV_LOG_ERROR, "Failed to create program: %d.\n", cle);
return AVERROR(EIO);
}
cle = clBuildProgram(ctx->program, 1, &ctx->hwctx->device_id,
NULL, NULL, NULL);
if (cle != CL_SUCCESS) {
av_log(avctx, AV_LOG_ERROR, "Failed to build program: %d.\n", cle);
if (cle == CL_BUILD_PROGRAM_FAILURE) {
char *log;
size_t log_length;
clGetProgramBuildInfo(ctx->program, ctx->hwctx->device_id,
CL_PROGRAM_BUILD_LOG, 0, NULL, &log_length);
log = av_malloc(log_length);
if (log) {
cle = clGetProgramBuildInfo(ctx->program,
ctx->hwctx->device_id,
CL_PROGRAM_BUILD_LOG,
log_length, log, NULL);
if (cle == CL_SUCCESS)
av_log(avctx, AV_LOG_ERROR, "Build log:\n%s\n", log);
}
av_free(log);
}
clReleaseProgram(ctx->program);
ctx->program = NULL;
return AVERROR(EIO);
}
return 0;
}
int ff_opencl_filter_load_program_from_file(AVFilterContext *avctx,
const char *filename)
{
FILE *file;
char *src = NULL;
size_t pos, len, rb;
const char *src_const;
int err;
file = avpriv_fopen_utf8(filename, "r");
if (!file) {
av_log(avctx, AV_LOG_ERROR, "Unable to open program "
"source file \"%s\".\n", filename);
return AVERROR(ENOENT);
}
len = 1 << 16;
pos = 0;
err = av_reallocp(&src, len);
if (err < 0)
goto fail;
err = snprintf(src, len, "#line 1 \"%s\"\n", filename);
if (err < 0) {
err = AVERROR(errno);
goto fail;
}
if (err > len / 2) {
err = AVERROR(EINVAL);
goto fail;
}
pos = err;
while (1) {
rb = fread(src + pos, 1, len - pos - 1, file);
if (rb == 0 && ferror(file)) {
err = AVERROR(EIO);
goto fail;
}
pos += rb;
if (pos + 1 < len)
break;
len <<= 1;
err = av_reallocp(&src, len);
if (err < 0)
goto fail;
}
src[pos] = 0;
src_const = src;
err = ff_opencl_filter_load_program(avctx, &src_const, 1);
fail:
fclose(file);
av_freep(&src);
return err;
}
int ff_opencl_filter_work_size_from_image(AVFilterContext *avctx,
size_t *work_size,
AVFrame *frame, int plane,
int block_alignment)
{
cl_mem image;
cl_mem_object_type type;
size_t width, height;
cl_int cle;
if (frame->format != AV_PIX_FMT_OPENCL) {
av_log(avctx, AV_LOG_ERROR, "Invalid frame format %s, "
"opencl required.\n", av_get_pix_fmt_name(frame->format));
return AVERROR(EINVAL);
}
image = (cl_mem)frame->data[plane];
if (!image) {
av_log(avctx, AV_LOG_ERROR, "Plane %d required but not set.\n",
plane);
return AVERROR(EINVAL);
}
cle = clGetMemObjectInfo(image, CL_MEM_TYPE, sizeof(type),
&type, NULL);
if (cle != CL_SUCCESS) {
av_log(avctx, AV_LOG_ERROR, "Failed to query object type of "
"plane %d: %d.\n", plane, cle);
return AVERROR_UNKNOWN;
}
if (type != CL_MEM_OBJECT_IMAGE2D) {
av_log(avctx, AV_LOG_ERROR, "Plane %d is not a 2D image.\n",
plane);
return AVERROR(EINVAL);
}
cle = clGetImageInfo(image, CL_IMAGE_WIDTH, sizeof(size_t),
&width, NULL);
if (cle != CL_SUCCESS) {
av_log(avctx, AV_LOG_ERROR, "Failed to query plane %d width: %d.\n",
plane, cle);
return AVERROR_UNKNOWN;
}
cle = clGetImageInfo(image, CL_IMAGE_HEIGHT, sizeof(size_t),
&height, NULL);
if (cle != CL_SUCCESS) {
av_log(avctx, AV_LOG_ERROR, "Failed to query plane %d height: %d.\n",
plane, cle);
return AVERROR_UNKNOWN;
}
if (block_alignment) {
width = FFALIGN(width, block_alignment);
height = FFALIGN(height, block_alignment);
}
work_size[0] = width;
work_size[1] = height;
return 0;
}
void ff_opencl_print_const_matrix_3x3(AVBPrint *buf, const char *name_str,
double mat[3][3])
{
int i, j;
av_bprintf(buf, "__constant float %s[9] = {\n", name_str);
for (i = 0; i < 3; i++) {
for (j = 0; j < 3; j++)
av_bprintf(buf, " %.5ff,", mat[i][j]);
av_bprintf(buf, "\n");
}
av_bprintf(buf, "};\n");
}
cl_ulong ff_opencl_get_event_time(cl_event event) {
cl_ulong time_start;
cl_ulong time_end;
clGetEventProfilingInfo(event, CL_PROFILING_COMMAND_START, sizeof(time_start), &time_start, NULL);
clGetEventProfilingInfo(event, CL_PROFILING_COMMAND_END, sizeof(time_end), &time_end, NULL);
return time_end - time_start;
}