On 2017/6/28 5:50, Mark Thompson wrote:
> ---
>  libavfilter/Makefile         |   6 +
>  libavfilter/opencl.c         | 285 
> +++++++++++++++++++++++++++++++++++++++++++
>  libavfilter/opencl.h         |  74 +++++++++++
>  libavfilter/opencl/rgbyuv.cl | 117 ++++++++++++++++++
>  libavfilter/opencl_source.h  |  24 ++++
>  tools/cl2c                   |  20 +++
>  6 files changed, 526 insertions(+)

I think we could provide a general colour space conversion solution based on 
OpenCL. For now,
I can think of some cases that this patch can't support. :) e.g.:

- YUV422 <-> 420P
- 10bits <-> 8bits
...

>  create mode 100644 libavfilter/opencl.c
>  create mode 100644 libavfilter/opencl.h
>  create mode 100644 libavfilter/opencl/rgbyuv.cl
>  create mode 100644 libavfilter/opencl_source.h
>  create mode 100755 tools/cl2c
> 
> diff --git a/libavfilter/Makefile b/libavfilter/Makefile
> index 348ad9211..1370ef04b 100644
> --- a/libavfilter/Makefile
> +++ b/libavfilter/Makefile
> @@ -106,3 +106,9 @@ OBJS-$(CONFIG_TESTSRC_FILTER)                += 
> vsrc_testsrc.o
>  
>  TOOLS     = graph2dot
>  TESTPROGS = filtfmts
> +# Turn each OpenCL kernel source (libavfilter/opencl/*.cl) into a C source file with tools/cl2c.
> +OPENCL = $(subst $(SRC_PATH)/,,$(wildcard 
> $(SRC_PATH)/libavfilter/opencl/*.cl))
> +.SECONDARY: $(OPENCL:.cl=.c)
> +libavfilter/opencl/%.c: TAG = OPENCL
> +libavfilter/opencl/%.c: $(SRC_PATH)/libavfilter/opencl/%.cl
> +     $(M)$(SRC_PATH)/tools/cl2c $< $@
> diff --git a/libavfilter/opencl.c b/libavfilter/opencl.c
> new file mode 100644
> index 000000000..f7b3f1818
> --- /dev/null
> +++ b/libavfilter/opencl.c
> @@ -0,0 +1,285 @@
> +/*
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 
> USA
> + */
> +
> +#include <stdio.h>
> +#include <string.h>
> +
> +#include "libavutil/hwcontext.h"
> +#include "libavutil/hwcontext_opencl.h"
> +#include "libavutil/mem.h"
> +
> +#include "avfilter.h"
> +#include "formats.h"
> +#include "opencl.h"
> +
> +/**
> + * Advertise AV_PIX_FMT_OPENCL as the only pixel format on every input
> + * and output link of the filter.
> + *
> + * @param avctx filter whose links are constrained
> + * @return 0 on success, AVERROR(ENOMEM) if a format list cannot be
> + *         allocated
> + */
> +int ff_opencl_filter_query_formats(AVFilterContext *avctx)
> +{
> +    static const enum AVPixelFormat formats[] = {
> +        AV_PIX_FMT_OPENCL,
> +        AV_PIX_FMT_NONE,
> +    };
> +    AVFilterFormats *list;
> +    int i;
> +
> +    for (i = 0; i < avctx->nb_inputs; i++) {
> +        // A fresh list is made per link; never hand a failed allocation
> +        // on to ff_formats_ref().
> +        list = ff_make_format_list(formats);
> +        if (!list)
> +            return AVERROR(ENOMEM);
> +        ff_formats_ref(list, &avctx->inputs[i]->out_formats);
> +    }
> +
> +    for (i = 0; i < avctx->nb_outputs; i++) {
> +        list = ff_make_format_list(formats);
> +        if (!list)
> +            return AVERROR(ENOMEM);
> +        ff_formats_ref(list, &avctx->outputs[i]->in_formats);
> +    }
> +
> +    return 0;
> +}
> +
> +/**
> + * Validate an input link and, for the first input only, record the
> + * OpenCL device and the default output parameters in the filter's
> + * private context.
> + *
> + * @param inlink input link being configured
> + * @return 0 on success; AVERROR(EINVAL) if the link has no hardware
> + *         frames context or the first input's frames are not
> + *         AV_PIX_FMT_OPENCL; AVERROR(ENOMEM) if the device reference
> + *         cannot be created
> + */
> +int ff_opencl_filter_config_input(AVFilterLink *inlink)
> +{
> +    AVFilterContext   *avctx = inlink->dst;
> +    OpenCLFilterContext *ctx = avctx->priv;
> +    AVHWFramesContext *input_frames;
> +
> +    if (!inlink->hw_frames_ctx) {
> +        av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires a "
> +               "hardware frames context on the input.\n");
> +        return AVERROR(EINVAL);
> +    }
> +
> +    // Extract the device and default output format from the first input.
> +    if (avctx->inputs[0] != inlink)
> +        return 0;
> +
> +    input_frames = (AVHWFramesContext*)inlink->hw_frames_ctx->data;
> +
> +    if (input_frames->format != AV_PIX_FMT_OPENCL) {
> +        av_log(avctx, AV_LOG_ERROR, "OpenCL filtering requires "
> +               "OpenCL frames on the input.\n");
> +        return AVERROR(EINVAL);
> +    }
> +
> +    // Drop any reference left by an earlier configuration so that it is
> +    // not leaked when the link is configured again.
> +    av_buffer_unref(&ctx->device_ref);
> +    ctx->device_ref = av_buffer_ref(input_frames->device_ref);
> +    if (!ctx->device_ref)
> +        return AVERROR(ENOMEM);
> +    ctx->device = input_frames->device_ctx;
> +    ctx->hwctx  = ctx->device->hwctx;
> +
> +    // Default output parameters match input parameters; values already
> +    // set in the context are left alone.
> +    if (ctx->output_format == AV_PIX_FMT_NONE)
> +        ctx->output_format = input_frames->sw_format;
> +    if (!ctx->output_width)
> +        ctx->output_width  = inlink->w;
> +    if (!ctx->output_height)
> +        ctx->output_height = inlink->h;
> +
> +    return 0;
> +}
> +
> +/**
> + * Replace the output link's hardware frames context with a new OpenCL
> + * one that uses the output format and dimensions stored in the filter's
> + * private context, and copy those dimensions to the link.
> + *
> + * @param outlink output link being configured
> + * @return 0 on success, AVERROR(ENOMEM) if the frames context cannot be
> + *         allocated, or the error from av_hwframe_ctx_init()
> + */
> +int ff_opencl_filter_config_output(AVFilterLink *outlink)
> +{
> +    AVFilterContext     *filter = outlink->src;
> +    OpenCLFilterContext *priv   = filter->priv;
> +    AVBufferRef         *frames_ref;
> +    AVHWFramesContext   *frames;
> +    int ret;
> +
> +    av_buffer_unref(&outlink->hw_frames_ctx);
> +
> +    frames_ref = av_hwframe_ctx_alloc(priv->device_ref);
> +    if (!frames_ref)
> +        return AVERROR(ENOMEM);
> +
> +    frames = (AVHWFramesContext*)frames_ref->data;
> +    frames->format    = AV_PIX_FMT_OPENCL;
> +    frames->sw_format = priv->output_format;
> +    frames->width     = priv->output_width;
> +    frames->height    = priv->output_height;
> +
> +    ret = av_hwframe_ctx_init(frames_ref);
> +    if (ret < 0) {
> +        av_log(filter, AV_LOG_ERROR, "Failed to initialise output "
> +               "frames: %d.\n", ret);
> +        // The link never took ownership, so release the context here.
> +        av_buffer_unref(&frames_ref);
> +        return ret;
> +    }
> +
> +    outlink->hw_frames_ctx = frames_ref;
> +    outlink->w = priv->output_width;
> +    outlink->h = priv->output_height;
> +
> +    return 0;
> +}
> +
> +/**
> + * Mark the output format in the private context as unset
> + * (AV_PIX_FMT_NONE).  Always returns 0.
> + */
> +int ff_opencl_filter_init(AVFilterContext *avctx)
> +{
> +    ((OpenCLFilterContext *)avctx->priv)->output_format = AV_PIX_FMT_NONE;
> +    return 0;
> +}
> +
> +/**
> + * Release the OpenCL program, if one was created, and drop the device
> + * reference held by the private context.  A failure to release the
> + * program is logged but does not stop the device reference being dropped.
> + */
> +void ff_opencl_filter_uninit(AVFilterContext *avctx)
> +{
> +    OpenCLFilterContext *priv = avctx->priv;
> +
> +    if (priv->program) {
> +        cl_int status = clReleaseProgram(priv->program);
> +
> +        if (status != CL_SUCCESS)
> +            av_log(avctx, AV_LOG_ERROR, "Failed to release "
> +                   "program: %d.\n", status);
> +    }
> +
> +    av_buffer_unref(&priv->device_ref);
> +}
> +
> +/**
> + * Build a small source fragment that aliases a generic conversion name
> + * to the colourspace-specific function, i.e.
> + * "#define <function>_<called_name> <function>_<suffix>", preceded by a
> + * #line directive.
> + *
> + * @param called_name name used after the "rgb_to_yuv_" / "yuv_to_rgb_"
> + *                    prefix in the macro being defined
> + * @param colorspace  colourspace selecting the suffix; values not listed
> + *                    in the switch fall back to "bt709"
> + * @param to_yuv      non-zero selects "rgb_to_yuv", zero "yuv_to_rgb"
> + * @return a string obtained from av_strdup() (the caller is presumably
> + *         expected to free it), or NULL if it cannot be allocated or the
> + *         fragment does not fit the internal buffer
> + */
> +const char *ff_opencl_make_rgbyuv(const char *called_name,
> +                                  enum AVColorSpace colorspace,
> +                                  int to_yuv)
> +{
> +    const char *function;
> +    const char *suffix;
> +    char tmp[256];
> +    int len;
> +
> +    if (to_yuv)
> +        function = "rgb_to_yuv";
> +    else
> +        function = "yuv_to_rgb";
> +
> +    switch (colorspace) {
> +    case AVCOL_SPC_BT709:
> +    default:
> +        suffix = "bt709";
> +        break;
> +    case AVCOL_SPC_BT470BG:
> +        suffix = "bt470bg";
> +        break;
> +    case AVCOL_SPC_SMPTE170M:
> +    // NOTE(review): SMPTE 240M shares the 170M functions here - confirm
> +    // that this approximation is intended.
> +    case AVCOL_SPC_SMPTE240M:
> +        suffix = "smpte170m";
> +        break;
> +    case AVCOL_SPC_BT2020_NCL:
> +    case AVCOL_SPC_BT2020_CL:
> +        suffix = "bt2020";
> +        break;
> +    }
> +
> +    len = snprintf(tmp, sizeof(tmp), "#line %d \"%s\"\n"
> +                   "#define %s_%s %s_%s\n", __LINE__, __FILE__,
> +                   function, called_name, function, suffix);
> +    // A truncated fragment would define a broken macro; report failure
> +    // rather than returning it.
> +    if (len < 0 || (size_t)len >= sizeof(tmp))
> +        return NULL;
> +
> +    return av_strdup(tmp);
> +}
> +
> +/**
> + * Create ctx->program from the given source strings and build it for
> + * the filter's device.
> + *
> + * If the build fails, the build log is printed when it can be
> + * retrieved, the program is released and ctx->program is reset to NULL.
> + *
> + * @param avctx                filter whose private context supplies the
> + *                             OpenCL context and device
> + * @param program_source_array source strings; no length array is passed
> + *                             to OpenCL, so each must be NUL-terminated
> + * @param nb_strings           number of entries in program_source_array
> + * @return 0 on success, AVERROR(EIO) if creating or building fails
> + */
> +static int opencl_filter_load_program(AVFilterContext *avctx,
> +                                      const char **program_source_array,
> +                                      int nb_strings)
> +{
> +    OpenCLFilterContext *ctx = avctx->priv;
> +    cl_int cle;
> +
> +    ctx->program = clCreateProgramWithSource(ctx->hwctx->context, nb_strings,
> +                                             program_source_array,
> +                                             NULL, &cle);
> +    if (!ctx->program) {
> +        av_log(avctx, AV_LOG_ERROR, "Failed to create program: %d.\n", cle);
> +        return AVERROR(EIO);
> +    }
> +
> +    cle = clBuildProgram(ctx->program, 1, &ctx->hwctx->device_id,
> +                         NULL, NULL, NULL);
> +    if (cle != CL_SUCCESS) {
> +        av_log(avctx, AV_LOG_ERROR, "Failed to build program: %d.\n", cle);
> +
> +        if (cle == CL_BUILD_PROGRAM_FAILURE) {
> +            char *log = NULL;
> +            size_t log_length = 0;
> +
> +            // First query only the size; skip the log if that fails.
> +            cle = clGetProgramBuildInfo(ctx->program, ctx->hwctx->device_id,
> +                                        CL_PROGRAM_BUILD_LOG, 0, NULL,
> +                                        &log_length);
> +            if (cle == CL_SUCCESS && log_length > 0)
> +                log = av_malloc(log_length);
> +            if (log) {
> +                cle = clGetProgramBuildInfo(ctx->program,
> +                                            ctx->hwctx->device_id,
> +                                            CL_PROGRAM_BUILD_LOG,
> +                                            log_length, log, NULL);
> +                if (cle == CL_SUCCESS)
> +                    av_log(avctx, AV_LOG_ERROR, "Build log:\n%s\n", log);
> +            }
> +
> +            av_free(log);
> +        }
> +
> +        clReleaseProgram(ctx->program);
> +        // Clear the handle so that ff_opencl_filter_uninit() does not
> +        // release the same program a second time.
> +        ctx->program = NULL;
> +        return AVERROR(EIO);
> +    }
> +
> +    return 0;
> +}
> +
> +/**
> + * Build the filter's program from in-memory source strings.  The
> + * arguments are forwarded unchanged to opencl_filter_load_program() and
> + * its result is returned.
> + */
> +int ff_opencl_filter_load_program(AVFilterContext *avctx,
> +                                  const char **program_source_array,
> +                                  int nb_strings)
> +{
> +    int ret = opencl_filter_load_program(avctx, program_source_array,
> +                                         nb_strings);
> +
> +    return ret;
> +}
> +
> +/**
> + * Read a whole file into memory as one NUL-terminated string and build
> + * it as the filter's OpenCL program.
> + *
> + * @param avctx    filter to load the program into
> + * @param filename path of the program source file
> + * @return 0 on success; AVERROR(ENOENT) if the file cannot be opened;
> + *         AVERROR(EIO) on a read error; the av_reallocp() error if the
> + *         buffer cannot grow; otherwise the result of
> + *         opencl_filter_load_program()
> + */
> +int ff_opencl_filter_load_program_from_file(AVFilterContext *avctx,
> +                                            const char *filename)
> +{
> +    FILE *file;
> +    char *src = NULL;
> +    size_t pos, len, rb;
> +    const char *src_const;
> +    int err;
> +
> +    file = fopen(filename, "r");
> +    if (!file) {
> +        av_log(avctx, AV_LOG_ERROR, "Unable to open program "
> +               "source file \"%s\".\n", filename);
> +        return AVERROR(ENOENT);
> +    }
> +
> +    len = 1 << 16;
> +    pos = 0;
> +    while (1) {
> +        err = av_reallocp(&src, len);
> +        if (err < 0)
> +            goto fail;
> +        // Always leave one byte free for the terminating NUL.
> +        rb = fread(src + pos, 1, len - pos - 1, file);
> +        if (ferror(file)) {
> +            err = AVERROR(EIO);
> +            goto fail;
> +        }
> +        pos += rb;
> +        // A short read means end of file.  A full read leaves pos at
> +        // len - 1, so the buffer has to grow before reading on; testing
> +        // against len would always stop after the first chunk and
> +        // silently truncate larger files.
> +        if (pos < len - 1)
> +            break;
> +        len <<= 1;
> +    }
> +    src[pos] = 0;
> +
> +    src_const = src;
> +
> +    err = opencl_filter_load_program(avctx, &src_const, 1);
> +fail:
> +    fclose(file);
> +    av_freep(&src);
> +    return err;
> +}
> diff --git a/libavfilter/opencl.h b/libavfilter/opencl.h
> new file mode 100644
> index 000000000..5b6caa0f2
> --- /dev/null
> +++ b/libavfilter/opencl.h
> @@ -0,0 +1,74 @@
> +/*
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 
> USA
> + */
> +
> +#ifndef AVFILTER_OPENCL_H
> +#define AVFILTER_OPENCL_H
> +
> +#include "libavutil/buffer.h"
> +#include "libavutil/hwcontext.h"
> +#include "libavutil/hwcontext_opencl.h"
> +#include "libavutil/pixfmt.h"
> +
> +#include "avfilter.h"
> +
> +typedef struct OpenCLFilterContext { /* private context shared by the ff_opencl_filter_* helpers */
> +    const AVClass     *class;
> +
> +    AVBufferRef       *device_ref; /**< reference to the device, taken from the first input's frames context */
> +    AVHWDeviceContext *device; /**< device context of the first input's frames context */
> +    AVOpenCLDeviceContext *hwctx; /**< device->hwctx, giving the OpenCL context and device id */
> +
> +    cl_program         program; /**< program built by the load_program helpers, released in uninit */
> +
> +    enum AVPixelFormat output_format; /**< sw_format of output frames; AV_PIX_FMT_NONE means "use the input's" */
> +    int                output_width; /**< output width; 0 means "use the input link's width" */
> +    int                output_height; /**< output height; 0 means "use the input link's height" */
> +} OpenCLFilterContext;
> +
> +/**
> + * Return that all inputs and outputs support only AV_PIX_FMT_OPENCL.
> + */
> +int ff_opencl_filter_query_formats(AVFilterContext *avctx);
> +
> +/**
> + * Check that the input link contains a suitable hardware frames
> + * context and extract the device from it.
> + */
> +int ff_opencl_filter_config_input(AVFilterLink *inlink);
> +
> +/**
> + * Create a suitable hardware frames context for the output.
> + */
> +int ff_opencl_filter_config_output(AVFilterLink *outlink);
> +
> +int ff_opencl_filter_init(AVFilterContext *avctx);
> +
> +void ff_opencl_filter_uninit(AVFilterContext *avctx);
> +
> +int ff_opencl_filter_load_program(AVFilterContext *avctx,
> +                                  const char **program_source_array,
> +                                  int nb_strings);
> +
> +int ff_opencl_filter_load_program_from_file(AVFilterContext *avctx,
> +                                            const char *filename);
> +
> +const char *ff_opencl_make_rgbyuv(const char *called_name,
> +                                  enum AVColorSpace colorspace,
> +                                  int to_yuv);
> +
> +#endif /* AVFILTER_OPENCL_H */
> diff --git a/libavfilter/opencl/rgbyuv.cl b/libavfilter/opencl/rgbyuv.cl
> new file mode 100644
> index 000000000..894905120
> --- /dev/null
> +++ b/libavfilter/opencl/rgbyuv.cl
> @@ -0,0 +1,117 @@
> +/*
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 
> USA
> + */
> +
> +/*
> + * Convert a YUV sample (.x = Y, .y = U, .z = V) to RGB using the
> + * "bt470bg" coefficients.  0.5 is subtracted from both chroma components
> + * before the matrix is applied; .w is passed through unchanged.
> + */
> +static inline float4 yuv_to_rgb_bt470bg(float4 yuv)
> +{
> +    const float4 yuv2r = (float4)(1.0f,  0.0f,   +1.140f, 0.0f);
> +    const float4 yuv2g = (float4)(1.0f, -0.396f, -0.581f, 0.0f);
> +    const float4 yuv2b = (float4)(1.0f, +2.029f,  0.0f,   0.0f);
> +    float4 rgb;
> +    yuv -= (float4)(0.0f, 0.5f, 0.5f, 0.0f);
> +    rgb.x = dot(yuv, yuv2r);
> +    rgb.y = dot(yuv, yuv2g);
> +    rgb.z = dot(yuv, yuv2b);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    rgb.w = yuv.w;
> +    return rgb;
> +}
> +
> +/*
> + * Convert an RGB sample to YUV (.x = Y, .y = U, .z = V) using the
> + * "bt470bg" coefficients.  Both chroma components are offset by 0.5;
> + * .w is passed through unchanged.
> + */
> +static inline float4 rgb_to_yuv_bt470bg(float4 rgb)
> +{
> +    const float4 rgb2y = (float4)(+0.299f, +0.587f, +0.114f, 0.0f);
> +    const float4 rgb2u = (float4)(-0.147f, -0.289f, +0.436f, 0.0f);
> +    const float4 rgb2v = (float4)(+0.615f, -0.515f, -0.100f, 0.0f);
> +    float4 yuv;
> +    yuv.x = dot(rgb, rgb2y);
> +    yuv.y = 0.5f + dot(rgb, rgb2u);
> +    yuv.z = 0.5f + dot(rgb, rgb2v);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    yuv.w = rgb.w;
> +    return yuv;
> +}
> +
> +/*
> + * Convert a YUV sample (.x = Y, .y = U, .z = V) to RGB using the
> + * "smpte170m" coefficients.  0.5 is subtracted from both chroma
> + * components before the matrix is applied; .w is passed through
> + * unchanged.
> + */
> +static inline float4 yuv_to_rgb_smpte170m(float4 yuv)
> +{
> +    const float4 yuv2r = (float4)(1.0f,  0.0f,   +1.403f, 0.0f);
> +    const float4 yuv2g = (float4)(1.0f, -0.344f, -0.714f, 0.0f);
> +    const float4 yuv2b = (float4)(1.0f, +1.773f,  0.0f,   0.0f);
> +    float4 rgb;
> +    yuv -= (float4)(0.0f, 0.5f, 0.5f, 0.0f);
> +    rgb.x = dot(yuv, yuv2r);
> +    rgb.y = dot(yuv, yuv2g);
> +    rgb.z = dot(yuv, yuv2b);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    rgb.w = yuv.w;
> +    return rgb;
> +}
> +
> +/*
> + * Convert an RGB sample to YUV (.x = Y, .y = U, .z = V) using the
> + * "smpte170m" coefficients.  Both chroma components are offset by 0.5;
> + * .w is passed through unchanged.
> + */
> +static inline float4 rgb_to_yuv_smpte170m(float4 rgb)
> +{
> +    const float4 rgb2y = (float4)(+0.299f, +0.587f, +0.114f, 0.0f);
> +    const float4 rgb2u = (float4)(-0.169f, -0.331f, +0.500f, 0.0f);
> +    const float4 rgb2v = (float4)(+0.500f, -0.419f, -0.081f, 0.0f);
> +    float4 yuv;
> +    yuv.x = dot(rgb, rgb2y);
> +    yuv.y = 0.5f + dot(rgb, rgb2u);
> +    yuv.z = 0.5f + dot(rgb, rgb2v);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    yuv.w = rgb.w;
> +    return yuv;
> +}
> +
> +/*
> + * Convert a YUV sample (.x = Y, .y = U, .z = V) to RGB using the
> + * "bt709" coefficients.  0.5 is subtracted from both chroma components
> + * before the matrix is applied; .w is passed through unchanged.
> + *
> + * NOTE(review): the V-to-R factor 1.5701 differs slightly from the
> + * commonly published BT.709 value (1.5748) - confirm the intended source.
> + */
> +static inline float4 yuv_to_rgb_bt709(float4 yuv)
> +{
> +    const float4 yuv2r = (float4)(1.0f,  0.0f,    +1.5701f, 0.0f);
> +    const float4 yuv2g = (float4)(1.0f, -0.1870f, -0.4664f, 0.0f);
> +    const float4 yuv2b = (float4)(1.0f, +1.8556f,  0.0f,    0.0f);
> +    float4 rgb;
> +    yuv -= (float4)(0.0f, 0.5f, 0.5f, 0.0f);
> +    rgb.x = dot(yuv, yuv2r);
> +    rgb.y = dot(yuv, yuv2g);
> +    rgb.z = dot(yuv, yuv2b);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    rgb.w = yuv.w;
> +    return rgb;
> +}
> +
> +/*
> + * Convert an RGB sample to YUV (.x = Y, .y = U, .z = V) using the
> + * "bt709" coefficients.  Both chroma components are offset by 0.5;
> + * .w is passed through unchanged.
> + *
> + * NOTE(review): the luma weights differ slightly from the commonly
> + * published BT.709 values (0.2126, 0.7152, 0.0722) - confirm the
> + * intended source.
> + */
> +static inline float4 rgb_to_yuv_bt709(float4 rgb)
> +{
> +    const float4 rgb2y = (float4)(+0.2215f, +0.7154f, +0.0721f, 0.0f);
> +    const float4 rgb2u = (float4)(-0.1145f, -0.3855f, +0.5000f, 0.0f);
> +    const float4 rgb2v = (float4)(+0.5016f, -0.4556f, -0.0459f, 0.0f);
> +    float4 yuv;
> +    yuv.x = dot(rgb, rgb2y);
> +    yuv.y = 0.5f + dot(rgb, rgb2u);
> +    yuv.z = 0.5f + dot(rgb, rgb2v);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    yuv.w = rgb.w;
> +    return yuv;
> +}
> +
> +/*
> + * Convert a YUV sample (.x = Y, .y = U, .z = V) to RGB using the
> + * "bt2020" coefficients.  0.5 is subtracted from both chroma components
> + * before the matrix is applied; .w is passed through unchanged.
> + */
> +static inline float4 yuv_to_rgb_bt2020(float4 yuv)
> +{
> +    const float4 yuv2r = (float4)(1.0f,  0.0f,     +1.4746f,  0.0f);
> +    const float4 yuv2g = (float4)(1.0f, -0.16455f, -0.57135f, 0.0f);
> +    const float4 yuv2b = (float4)(1.0f, +1.8814f,   0.0f,     0.0f);
> +    float4 rgb;
> +    yuv -= (float4)(0.0f, 0.5f, 0.5f, 0.0f);
> +    rgb.x = dot(yuv, yuv2r);
> +    rgb.y = dot(yuv, yuv2g);
> +    rgb.z = dot(yuv, yuv2b);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    rgb.w = yuv.w;
> +    return rgb;
> +}
> +
> +/*
> + * Convert an RGB sample to YUV (.x = Y, .y = U, .z = V) using the
> + * "bt2020" coefficients.  Both chroma components are offset by 0.5;
> + * .w is passed through unchanged.
> + */
> +static inline float4 rgb_to_yuv_bt2020(float4 rgb)
> +{
> +    const float4 rgb2y = (float4)(+0.2627f,  +0.6780f,  +0.0593f,  0.0f);
> +    const float4 rgb2u = (float4)(-0.13963f, -0.36037f, +0.5f,     0.0f);
> +    const float4 rgb2v = (float4)(+0.5f,     -0.45979f, -0.04021f, 0.0f);
> +    float4 yuv;
> +    yuv.x = dot(rgb, rgb2y);
> +    yuv.y = 0.5f + dot(rgb, rgb2u);
> +    yuv.z = 0.5f + dot(rgb, rgb2v);
> +    // Give the fourth component a defined value instead of leaving it
> +    // unassigned.
> +    yuv.w = rgb.w;
> +    return yuv;
> +}
> diff --git a/libavfilter/opencl_source.h b/libavfilter/opencl_source.h
> new file mode 100644
> index 000000000..d66c0b182
> --- /dev/null
> +++ b/libavfilter/opencl_source.h
> @@ -0,0 +1,24 @@
> +/*
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 
> USA
> + */
> +
> +#ifndef AVFILTER_OPENCL_SOURCE_H
> +#define AVFILTER_OPENCL_SOURCE_H
> +
> +extern const char *ff_opencl_source_rgbyuv;
> +
> +#endif /* AVFILTER_OPENCL_SOURCE_H */
> diff --git a/tools/cl2c b/tools/cl2c
> new file mode 100755
> index 000000000..1ead94081
> --- /dev/null
> +++ b/tools/cl2c
> @@ -0,0 +1,20 @@
> +#!/bin/sh
> +# Convert an OpenCL source file into a C source file containing the
> +# OpenCL source as a C string.  Also adds a #line directive so that
> +# compiler messages are useful.
> +
> +input="$1"
> +output="$2"
> +
> +name=$(basename "$input" | sed 's/.cl$//')
> +
> +cat >$output <<EOF
> +// Generated from $input
> +const char *ff_opencl_source_$name =
> +"#line 1 \"$input\"\n"
> +EOF
> +
> +# Convert \ to \\ and " to \", then add " to the start and end of the line.
> +cat "$input" | sed 's/\\/\\\\/g;s/\"/\\\"/g;s/^/\"/;s/$/\\n\"/' >>$output
> +
> +echo ";" >>$output
> 
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel

Reply via email to