---
libavfilter/Makefile | 6 +
libavfilter/opencl.c | 285 +++++++++++++++++++++++++++++++++++++++++++
libavfilter/opencl.h | 74 +++++++++++
libavfilter/opencl/rgbyuv.cl | 117 ++++++++++++++++++
libavfilter/opencl_source.h | 24 ++++
tools/cl2c | 20 +++
6 files changed, 526 insertions(+)
create mode 100644 libavfilter/opencl.c
create mode 100644 libavfilter/opencl.h
create mode 100644 libavfilter/opencl/rgbyuv.cl
create mode 100644 libavfilter/opencl_source.h
create mode 100755 tools/cl2c
diff --git a/libavfilter/Makefile b/libavfilter/Makefile
index 348ad9211..1370ef04b 100644
--- a/libavfilter/Makefile
+++ b/libavfilter/Makefile
@@ -106,3 +106,9 @@ OBJS-$(CONFIG_TESTSRC_FILTER) +=
vsrc_testsrc.o
TOOLS = graph2dot
TESTPROGS = filtfmts
+
+# All OpenCL kernel sources under libavfilter/opencl/, expressed as paths
+# relative to $(SRC_PATH).
+OPENCL = $(subst $(SRC_PATH)/,,$(wildcard $(SRC_PATH)/libavfilter/opencl/*.cl))
+# The .c files generated from the kernels are marked secondary so that make
+# does not remove them as intermediate files.
+.SECONDARY: $(OPENCL:.cl=.c)
+# Target-specific TAG for the generation rule (presumably the label that
+# $(M) prints in the build output - confirm against the common makefiles).
+libavfilter/opencl/%.c: TAG = OPENCL
+# Generate a C file embedding each kernel as a string using tools/cl2c.
+libavfilter/opencl/%.c: $(SRC_PATH)/libavfilter/opencl/%.cl
+ $(M)$(SRC_PATH)/tools/cl2c $< $@
diff --git a/libavfilter/opencl.c b/libavfilter/opencl.c
new file mode 100644
index 000000000..f7b3f1818
--- /dev/null
+++ b/libavfilter/opencl.c
@@ -0,0 +1,285 @@
+/*
+ * This file is part of Libav.
+ *
+ * Libav is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * Libav is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with Libav; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include <stdio.h>
+#include <string.h>
+
+#include "libavutil/hwcontext.h"
+#include "libavutil/hwcontext_opencl.h"
+#include "libavutil/mem.h"
+
+#include "avfilter.h"
+#include "formats.h"
+#include "opencl.h"
+
+/**
+ * Restrict every input and output link of the filter to AV_PIX_FMT_OPENCL.
+ *
+ * A separate format list is created for each link.
+ *
+ * @param avctx filter whose links are constrained
+ * @return 0 on success, AVERROR(ENOMEM) if a format list could not be
+ *         created
+ */
+int ff_opencl_filter_query_formats(AVFilterContext *avctx)
+{
+    static const enum AVPixelFormat formats[] = {
+        AV_PIX_FMT_OPENCL,
+        AV_PIX_FMT_NONE,
+    };
+    AVFilterFormats *list;
+    unsigned i;
+
+    for (i = 0; i < avctx->nb_inputs; i++) {
+        // Never hand a failed (NULL) list on to ff_formats_ref().
+        list = ff_make_format_list(formats);
+        if (!list)
+            return AVERROR(ENOMEM);
+        ff_formats_ref(list, &avctx->inputs[i]->out_formats);
+    }
+
+    for (i = 0; i < avctx->nb_outputs; i++) {
+        list = ff_make_format_list(formats);
+        if (!list)
+            return AVERROR(ENOMEM);
+        ff_formats_ref(list, &avctx->outputs[i]->in_formats);
+    }
+
+    return 0;
+}
+
+/**
+ * Validate an input link and, for the first input only, pick up the
+ * OpenCL device and the default output parameters from it.
+ *
+ * @param inlink input link being configured
+ * @return 0 on success, AVERROR(EINVAL) if the link has no hardware frames
+ *         context or the first input's frames are not AV_PIX_FMT_OPENCL,
+ *         AVERROR(ENOMEM) if the device reference cannot be taken
+ */
+int ff_opencl_filter_config_input(AVFilterLink *inlink)
+{
+    AVFilterContext *avctx   = inlink->dst;
+    OpenCLFilterContext *ctx = avctx->priv;
+    AVHWFramesContext *frames;
+
+    if (!inlink->hw_frames_ctx) {
+        av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires a "
+               "hardware frames context on the input.\n");
+        return AVERROR(EINVAL);
+    }
+
+    // Secondary inputs only need the presence check above; the device
+    // and the output defaults come from input 0.
+    if (inlink != avctx->inputs[0])
+        return 0;
+
+    frames = (AVHWFramesContext*)inlink->hw_frames_ctx->data;
+    if (frames->format != AV_PIX_FMT_OPENCL)
+        return AVERROR(EINVAL);
+
+    ctx->device_ref = av_buffer_ref(frames->device_ref);
+    if (!ctx->device_ref)
+        return AVERROR(ENOMEM);
+    ctx->device = frames->device_ctx;
+    ctx->hwctx  = ctx->device->hwctx;
+
+    // Anything the filter has not chosen itself is inherited from the input.
+    if (ctx->output_format == AV_PIX_FMT_NONE)
+        ctx->output_format = frames->sw_format;
+    if (!ctx->output_width)
+        ctx->output_width = inlink->w;
+    if (!ctx->output_height)
+        ctx->output_height = inlink->h;
+
+    return 0;
+}
+
+/**
+ * Replace the output link's hardware frames context with a new OpenCL one
+ * built from the filter's device and its output format and dimensions.
+ *
+ * The previous frames context of the link is dropped before the new one is
+ * created, so it is gone even when this function fails.
+ *
+ * @param outlink output link being configured
+ * @return 0 on success, AVERROR(ENOMEM) if the frames context cannot be
+ *         allocated, or the error returned by av_hwframe_ctx_init()
+ */
+int ff_opencl_filter_config_output(AVFilterLink *outlink)
+{
+    AVFilterContext *avctx   = outlink->src;
+    OpenCLFilterContext *ctx = avctx->priv;
+    AVBufferRef *frames_ref;
+    AVHWFramesContext *frames;
+    int ret;
+
+    av_buffer_unref(&outlink->hw_frames_ctx);
+
+    frames_ref = av_hwframe_ctx_alloc(ctx->device_ref);
+    if (!frames_ref)
+        return AVERROR(ENOMEM);
+
+    frames = (AVHWFramesContext*)frames_ref->data;
+    frames->format    = AV_PIX_FMT_OPENCL;
+    frames->sw_format = ctx->output_format;
+    frames->width     = ctx->output_width;
+    frames->height    = ctx->output_height;
+
+    ret = av_hwframe_ctx_init(frames_ref);
+    if (ret < 0) {
+        av_log(avctx, AV_LOG_ERROR, "Failed to initialise output "
+               "frames: %d.\n", ret);
+        av_buffer_unref(&frames_ref);
+        return ret;
+    }
+
+    // Ownership of the new reference passes to the link.
+    outlink->hw_frames_ctx = frames_ref;
+    outlink->w = ctx->output_width;
+    outlink->h = ctx->output_height;
+
+    return 0;
+}
+
+/**
+ * Common init step: mark the output format as not chosen yet, so that
+ * ff_opencl_filter_config_input() falls back to the input's format.
+ *
+ * @return always 0
+ */
+int ff_opencl_filter_init(AVFilterContext *avctx)
+{
+    OpenCLFilterContext *priv = avctx->priv;
+
+    priv->output_format = AV_PIX_FMT_NONE;
+    return 0;
+}
+
+/**
+ * Common uninit step: release the OpenCL program, if one was loaded, and
+ * drop the reference to the device.
+ *
+ * A failure to release the program is logged but otherwise ignored.
+ */
+void ff_opencl_filter_uninit(AVFilterContext *avctx)
+{
+    OpenCLFilterContext *priv = avctx->priv;
+
+    if (priv->program) {
+        cl_int status = clReleaseProgram(priv->program);
+
+        if (status != CL_SUCCESS)
+            av_log(avctx, AV_LOG_ERROR, "Failed to release "
+                   "program: %d.\n", status);
+    }
+
+    av_buffer_unref(&priv->device_ref);
+}
+
+/**
+ * Build a small OpenCL source snippet that aliases a generic conversion
+ * name to the colourspace-specific function in rgbyuv.cl.
+ *
+ * The snippet is a #line directive followed by
+ *   #define <function>_<called_name> <function>_<suffix>
+ * where <function> is "rgb_to_yuv" or "yuv_to_rgb".
+ *
+ * @param called_name name appended to the generic function name
+ * @param colorspace  selects the suffix; BT.709 is used for any colourspace
+ *                    not listed explicitly
+ * @param to_yuv      nonzero for rgb_to_yuv, zero for yuv_to_rgb
+ * @return string allocated with av_strdup(), owned by the caller, or NULL
+ *         if allocation fails or the snippet does not fit the internal
+ *         buffer
+ */
+const char *ff_opencl_make_rgbyuv(const char *called_name,
+                                  enum AVColorSpace colorspace,
+                                  int to_yuv)
+{
+    const char *function = to_yuv ? "rgb_to_yuv" : "yuv_to_rgb";
+    const char *suffix;
+    char tmp[256];
+    int len;
+
+    switch (colorspace) {
+    case AVCOL_SPC_BT470BG:
+        suffix = "bt470bg";
+        break;
+    case AVCOL_SPC_SMPTE170M:
+    case AVCOL_SPC_SMPTE240M:
+        // SMPTE 240M shares the SMPTE 170M functions here.
+        suffix = "smpte170m";
+        break;
+    case AVCOL_SPC_BT2020_NCL:
+    case AVCOL_SPC_BT2020_CL:
+        suffix = "bt2020";
+        break;
+    case AVCOL_SPC_BT709:
+    default:
+        suffix = "bt709";
+        break;
+    }
+
+    len = snprintf(tmp, sizeof(tmp), "#line %d \"%s\"\n"
+                   "#define %s_%s %s_%s\n", __LINE__, __FILE__,
+                   function, called_name, function, suffix);
+    // A truncated snippet would be a malformed #define; refuse it rather
+    // than pass broken source to the OpenCL compiler.
+    if (len < 0 || (size_t)len >= sizeof(tmp))
+        return NULL;
+
+    return av_strdup(tmp);
+}
+
+/**
+ * Create an OpenCL program from source strings and build it for the
+ * filter's device, storing the result in ctx->program.
+ *
+ * If the build fails with CL_BUILD_PROGRAM_FAILURE the build log is fetched
+ * and logged. On any failure ctx->program is left NULL, so that
+ * ff_opencl_filter_uninit() does not release the program a second time.
+ *
+ * @param avctx                filter context (priv is OpenCLFilterContext)
+ * @param program_source_array array of NUL-terminated source strings
+ * @param nb_strings           number of entries in program_source_array
+ * @return 0 on success, AVERROR(EIO) if creation or build fails
+ */
+static int opencl_filter_load_program(AVFilterContext *avctx,
+                                      const char **program_source_array,
+                                      int nb_strings)
+{
+    OpenCLFilterContext *ctx = avctx->priv;
+    cl_int cle;
+
+    ctx->program = clCreateProgramWithSource(ctx->hwctx->context, nb_strings,
+                                             program_source_array,
+                                             NULL, &cle);
+    if (!ctx->program) {
+        av_log(avctx, AV_LOG_ERROR, "Failed to create program: %d.\n", cle);
+        return AVERROR(EIO);
+    }
+
+    cle = clBuildProgram(ctx->program, 1, &ctx->hwctx->device_id,
+                         NULL, NULL, NULL);
+    if (cle != CL_SUCCESS) {
+        av_log(avctx, AV_LOG_ERROR, "Failed to build program: %d.\n", cle);
+
+        if (cle == CL_BUILD_PROGRAM_FAILURE) {
+            char *log = NULL;
+            size_t log_length = 0;
+
+            // First query only the size; skip the log if that fails.
+            cle = clGetProgramBuildInfo(ctx->program, ctx->hwctx->device_id,
+                                        CL_PROGRAM_BUILD_LOG, 0, NULL,
+                                        &log_length);
+            if (cle == CL_SUCCESS && log_length > 0)
+                log = av_malloc(log_length);
+            if (log) {
+                cle = clGetProgramBuildInfo(ctx->program,
+                                            ctx->hwctx->device_id,
+                                            CL_PROGRAM_BUILD_LOG,
+                                            log_length, log, NULL);
+                if (cle == CL_SUCCESS)
+                    av_log(avctx, AV_LOG_ERROR, "Build log:\n%s\n", log);
+            }
+
+            av_free(log);
+        }
+
+        clReleaseProgram(ctx->program);
+        // Clear the stale handle so that uninit does not release it again.
+        ctx->program = NULL;
+        return AVERROR(EIO);
+    }
+
+    return 0;
+}
+
+/**
+ * Exported entry point for building the filter's OpenCL program from an
+ * array of source strings; forwards to opencl_filter_load_program().
+ *
+ * @return whatever opencl_filter_load_program() returns
+ */
+int ff_opencl_filter_load_program(AVFilterContext *avctx,
+                                  const char **program_source_array,
+                                  int nb_strings)
+{
+    int ret = opencl_filter_load_program(avctx, program_source_array,
+                                         nb_strings);
+
+    return ret;
+}
+
+/**
+ * Read an OpenCL source file completely into memory and build it as the
+ * filter's program.
+ *
+ * The buffer starts at 64 KiB and is doubled until the whole file fits.
+ *
+ * @param avctx    filter context (priv is OpenCLFilterContext)
+ * @param filename path of the source file
+ * @return 0 on success, AVERROR(ENOENT) if the file cannot be opened,
+ *         AVERROR(EIO) on a read error, the av_reallocp() error if the
+ *         buffer cannot grow, or the error from building the program
+ */
+int ff_opencl_filter_load_program_from_file(AVFilterContext *avctx,
+                                            const char *filename)
+{
+    FILE *file;
+    char *src = NULL;
+    size_t pos, len, rb;
+    const char *src_const;
+    int err;
+
+    file = fopen(filename, "r");
+    if (!file) {
+        av_log(avctx, AV_LOG_ERROR, "Unable to open program "
+               "source file \"%s\".\n", filename);
+        return AVERROR(ENOENT);
+    }
+
+    len = 1 << 16;
+    pos = 0;
+    while (1) {
+        err = av_reallocp(&src, len);
+        if (err < 0)
+            goto fail;
+        // One byte is always held back for the terminating NUL.
+        rb = fread(src + pos, 1, len - pos - 1, file);
+        // Reject any stream error, even after a partial read, rather than
+        // compile a truncated program.
+        if (ferror(file)) {
+            err = AVERROR(EIO);
+            goto fail;
+        }
+        pos += rb;
+        // fread() can fill the buffer only up to len - 1, so a short read
+        // (end of file) is pos < len - 1; otherwise grow and read on.
+        if (pos < len - 1)
+            break;
+        len <<= 1;
+    }
+    src[pos] = 0;
+
+    src_const = src;
+
+    err = opencl_filter_load_program(avctx, &src_const, 1);
+fail:
+    fclose(file);
+    av_freep(&src);
+    return err;
+}
diff --git a/libavfilter/opencl.h b/libavfilter/opencl.h
new file mode 100644
index 000000000..5b6caa0f2
--- /dev/null
+++ b/libavfilter/opencl.h
@@ -0,0 +1,74 @@
+/*
+ * This file is part of Libav.
+ *
+ * Libav is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * Libav is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with Libav; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#ifndef AVFILTER_OPENCL_H
+#define AVFILTER_OPENCL_H
+
+#include "libavutil/buffer.h"
+#include "libavutil/hwcontext.h"
+#include "libavutil/hwcontext_opencl.h"
+#include "libavutil/pixfmt.h"
+
+#include "avfilter.h"
+
+/**
+ * State shared by the ff_opencl_filter_*() helpers; it is read from
+ * AVFilterContext.priv by all of them.
+ */
+typedef struct OpenCLFilterContext {
+ const AVClass *class;
+
+ /** Device reference taken from the first input's frames context in
+  *  ff_opencl_filter_config_input(); dropped in ff_opencl_filter_uninit(). */
+ AVBufferRef *device_ref;
+ /** device_ctx of the first input's frames context (no extra reference). */
+ AVHWDeviceContext *device;
+ /** OpenCL-specific part of device (device->hwctx). */
+ AVOpenCLDeviceContext *hwctx;
+
+ /** Program created by the load_program helpers; released in
+  *  ff_opencl_filter_uninit() when non-NULL. */
+ cl_program program;
+
+ /** Software format of the output frames; AV_PIX_FMT_NONE after init
+  *  means "use the sw_format of the first input". */
+ enum AVPixelFormat output_format;
+ /** Output width; 0 means "use the width of the first input". */
+ int output_width;
+ /** Output height; 0 means "use the height of the first input". */
+ int output_height;
+} OpenCLFilterContext;
+
+/**
+ * Return that all inputs and outputs support only AV_PIX_FMT_OPENCL.
+ */
+int ff_opencl_filter_query_formats(AVFilterContext *avctx);
+
+/**
+ * Check that the input link contains a suitable hardware frames
+ * context and extract the device from it.
+ */
+int ff_opencl_filter_config_input(AVFilterLink *inlink);
+
+/**
+ * Create a suitable hardware frames context for the output.
+ */
+int ff_opencl_filter_config_output(AVFilterLink *outlink);
+
+/**
+ * Initialise the common context: the output format is set to
+ * AV_PIX_FMT_NONE so that it defaults to the input's format later.
+ * Always returns 0.
+ */
+int ff_opencl_filter_init(AVFilterContext *avctx);
+
+/**
+ * Release the loaded program, if any, and the device reference.
+ */
+void ff_opencl_filter_uninit(AVFilterContext *avctx);
+
+/**
+ * Create a program from nb_strings source strings and build it for the
+ * filter's device; the program is stored in the filter context.
+ *
+ * @return 0 on success, AVERROR(EIO) if creating or building fails
+ */
+int ff_opencl_filter_load_program(AVFilterContext *avctx,
+ const char **program_source_array,
+ int nb_strings);
+
+/**
+ * Read program source from the named file and build it as a single
+ * source string.
+ *
+ * @return 0 on success, AVERROR(ENOENT) if the file cannot be opened,
+ *         another negative error code on read, allocation or build failure
+ */
+int ff_opencl_filter_load_program_from_file(AVFilterContext *avctx,
+ const char *filename);
+
+/**
+ * Make a source snippet defining rgb_to_yuv_<called_name> (to_yuv != 0)
+ * or yuv_to_rgb_<called_name> (to_yuv == 0) as the matching function for
+ * the given colourspace; unlisted colourspaces use the BT.709 functions.
+ *
+ * @return newly allocated string, or NULL on failure
+ */
+const char *ff_opencl_make_rgbyuv(const char *called_name,
+ enum AVColorSpace colorspace,
+ int to_yuv);
+
+#endif /* AVFILTER_OPENCL_H */
diff --git a/libavfilter/opencl/rgbyuv.cl b/libavfilter/opencl/rgbyuv.cl
new file mode 100644
index 000000000..894905120
--- /dev/null
+++ b/libavfilter/opencl/rgbyuv.cl
@@ -0,0 +1,117 @@
+/*
+ * This file is part of Libav.
+ *
+ * Libav is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * Libav is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with Libav; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+/*
+ * YUV -> RGB using the bt470bg coefficient set. The 0.5 chroma offset is
+ * removed from .y and .z before the matrix is applied; the .w component of
+ * the result is not written.
+ */
+static inline float4 yuv_to_rgb_bt470bg(float4 yuv)
+{
+    float4 centred = yuv - (float4)(0.0, 0.5, 0.5, 0.0);
+    float4 out;
+    out.x = dot(centred, (float4)(1.0, 0.0, +1.140, 0.0));
+    out.y = dot(centred, (float4)(1.0, -0.396, -0.581, 0.0));
+    out.z = dot(centred, (float4)(1.0, +2.029, 0.0, 0.0));
+    return out;
+}
+
+/*
+ * RGB -> YUV using the bt470bg coefficient set; 0.5 is added to both
+ * chroma components. The .w component of the result is not written.
+ *
+ * NOTE(review): with these rows pure red (1, 0, 0) gives
+ * V = 0.5 + 0.615 = 1.115 - confirm whether values above 1 are intended
+ * or whether the smpte170m-style scaled rows should be used here.
+ */
+static inline float4 rgb_to_yuv_bt470bg(float4 rgb)
+{
+    float4 row_y = (float4)(+0.299, +0.587, +0.114, 0.0);
+    float4 row_u = (float4)(-0.147, -0.289, +0.436, 0.0);
+    float4 row_v = (float4)(+0.615, -0.515, -0.100, 0.0);
+    float4 out;
+    out.x = dot(rgb, row_y);
+    out.y = dot(rgb, row_u) + 0.5f;
+    out.z = dot(rgb, row_v) + 0.5f;
+    return out;
+}
+
+/*
+ * YUV -> RGB using the smpte170m coefficient set. Chroma (.y, .z) is
+ * re-centred around zero first; the .w component of the result is not
+ * written.
+ */
+static inline float4 yuv_to_rgb_smpte170m(float4 yuv)
+{
+    float4 centred = yuv - (float4)(0.0, 0.5, 0.5, 0.0);
+    float4 out;
+    out.x = dot(centred, (float4)(1.0, 0.0, +1.403, 0.0));
+    out.y = dot(centred, (float4)(1.0, -0.344, -0.714, 0.0));
+    out.z = dot(centred, (float4)(1.0, +1.773, 0.0, 0.0));
+    return out;
+}
+
+/*
+ * RGB -> YUV using the smpte170m coefficient set; chroma is offset by 0.5.
+ * The .w component of the result is not written.
+ */
+static inline float4 rgb_to_yuv_smpte170m(float4 rgb)
+{
+    float4 row_y = (float4)(+0.299, +0.587, +0.114, 0.0);
+    float4 row_u = (float4)(-0.169, -0.331, +0.500, 0.0);
+    float4 row_v = (float4)(+0.500, -0.419, -0.081, 0.0);
+    float4 out;
+    out.x = dot(rgb, row_y);
+    out.y = dot(rgb, row_u) + 0.5f;
+    out.z = dot(rgb, row_v) + 0.5f;
+    return out;
+}
+
+/*
+ * YUV -> RGB for BT.709 (Kr = 0.2126, Kb = 0.0722).
+ *
+ * Coefficients are derived from the luma weights:
+ *   R = Y + 2(1 - Kr) V                 -> 1.5748
+ *   B = Y + 2(1 - Kb) U                 -> 1.8556
+ *   G = Y - (Kb * 1.8556 / Kg) U        -> 0.1873
+ *         - (Kr * 1.5748 / Kg) V        -> 0.4681
+ * Chroma (.y, .z) is re-centred around zero first; the .w component of the
+ * result is not written.
+ */
+static inline float4 yuv_to_rgb_bt709(float4 yuv)
+{
+    float4 yuv2r = (float4)(1.0, 0.0, +1.5748, 0.0);
+    float4 yuv2g = (float4)(1.0, -0.1873, -0.4681, 0.0);
+    float4 yuv2b = (float4)(1.0, +1.8556, 0.0, 0.0);
+    float4 rgb;
+    yuv -= (float4)(0.0, 0.5, 0.5, 0.0);
+    rgb.x = dot(yuv, yuv2r);
+    rgb.y = dot(yuv, yuv2g);
+    rgb.z = dot(yuv, yuv2b);
+    return rgb;
+}
+
+/*
+ * RGB -> YUV for BT.709 (Kr = 0.2126, Kg = 0.7152, Kb = 0.0722).
+ *
+ * The luma row sums to exactly 1, so white maps to Y = 1. The chroma rows
+ * are (B - Y) / 1.8556 and (R - Y) / 1.5748, so each sums to 0 and grey
+ * maps to U = V = 0.5. The .w component of the result is not written.
+ */
+static inline float4 rgb_to_yuv_bt709(float4 rgb)
+{
+    float4 rgb2y = (float4)(+0.2126, +0.7152, +0.0722, 0.0);
+    float4 rgb2u = (float4)(-0.1146, -0.3854, +0.5000, 0.0);
+    float4 rgb2v = (float4)(+0.5000, -0.4542, -0.0458, 0.0);
+    float4 yuv;
+    yuv.x = dot(rgb, rgb2y);
+    yuv.y = 0.5f + dot(rgb, rgb2u);
+    yuv.z = 0.5f + dot(rgb, rgb2v);
+    return yuv;
+}
+
+/*
+ * YUV -> RGB using the bt2020 coefficient set. Chroma (.y, .z) is
+ * re-centred around zero first; the .w component of the result is not
+ * written.
+ */
+static inline float4 yuv_to_rgb_bt2020(float4 yuv)
+{
+    float4 centred = yuv - (float4)(0.0, 0.5, 0.5, 0.0);
+    float4 out;
+    out.x = dot(centred, (float4)(1.0, 0.0, +1.4746, 0.0));
+    out.y = dot(centred, (float4)(1.0, -0.16455, -0.57135, 0.0));
+    out.z = dot(centred, (float4)(1.0, +1.8814, 0.0, 0.0));
+    return out;
+}
+
+/*
+ * RGB -> YUV using the bt2020 coefficient set; chroma is offset by 0.5.
+ * The .w component of the result is not written.
+ */
+static inline float4 rgb_to_yuv_bt2020(float4 rgb)
+{
+    float4 row_y = (float4)(+0.2627, +0.6780, +0.0593, 0.0);
+    float4 row_u = (float4)(-0.13963, -0.36037, +0.5, 0.0);
+    float4 row_v = (float4)(+0.5, -0.45979, -0.04021, 0.0);
+    float4 out;
+    out.x = dot(rgb, row_y);
+    out.y = dot(rgb, row_u) + 0.5f;
+    out.z = dot(rgb, row_v) + 0.5f;
+    return out;
+}
diff --git a/libavfilter/opencl_source.h b/libavfilter/opencl_source.h
new file mode 100644
index 000000000..d66c0b182
--- /dev/null
+++ b/libavfilter/opencl_source.h
@@ -0,0 +1,24 @@
+/*
+ * This file is part of Libav.
+ *
+ * Libav is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * Libav is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with Libav; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#ifndef AVFILTER_OPENCL_SOURCE_H
+#define AVFILTER_OPENCL_SOURCE_H
+
+/**
+ * Contents of libavfilter/opencl/rgbyuv.cl as a C string. The definition
+ * lives in a C file generated from the .cl source by tools/cl2c.
+ */
+extern const char *ff_opencl_source_rgbyuv;
+
+#endif /* AVFILTER_OPENCL_SOURCE_H */
diff --git a/tools/cl2c b/tools/cl2c
new file mode 100755
index 000000000..1ead94081
--- /dev/null
+++ b/tools/cl2c
@@ -0,0 +1,20 @@
+#!/bin/sh
+# Convert an OpenCL source file into a C source file containing the
+# OpenCL source as a C string. Also adds a #line directive so that
+# compiler messages are useful.
+
+input="$1"
+output="$2"
+
+name=$(basename "$input" | sed 's/.cl$//')
+
+cat >$output <<EOF
+// Generated from $input
+const char *ff_opencl_source_$name =
+"#line 1 \"$input\"\n"
+EOF
+
+# Convert \ to \\ and " to \", then add " to the start and end of the line.
+cat "$input" | sed 's/\\/\\\\/g;s/\"/\\\"/g;s/^/\"/;s/$/\\n\"/' >>$output
+
+echo ";" >>$output
--
2.11.0
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel