FFmpeg/libavfilter/vf_derain.c

/*
 * Copyright (c) 2019 Xuewei Meng
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * Filter implementing image derain filter using deep convolutional networks.
 * http://openaccess.thecvf.com/content_ECCV_2018/html/Xia_Li_Recurrent_Squeeze-and-Excitation_Context_ECCV_2018_paper.html
 */

#include "libavformat/avio.h"
#include "libavutil/opt.h"
#include "avfilter.h"
#include "dnn_filter_common.h"
#include "formats.h"
#include "internal.h"

/**
 * Private state of the derain filter instance.
 *
 * The members are written through the option table in this file, which
 * addresses them with offsetof(DRContext, ...); keep the layout in sync
 * with that table.
 */
typedef struct DRContext {
    const AVClass *class;       /* class descriptor; the filter registers &derain_class as priv_class */
    DnnContext     dnnctx;      /* DNN state handed to ff_dnn_init / ff_dnn_execute_model / ff_dnn_uninit */
    int            filter_type; /* value of the "filter_type" option: 0 = derain, 1 = dehaze */
} DRContext;

/* Byte offset of a DRContext member, as required by the AVOption table below. */
#define OFFSET(x) offsetof(DRContext, x)
/*
 * Flags shared by every option of this filter.  The expansion is
 * parenthesized so it always behaves as a single operand, whatever
 * expression it is pasted into.
 */
#define FLAGS (AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM)

/**
 * Options accepted by the derain filter.
 *
 * - filter_type: 0 ("derain") or 1 ("dehaze"); stored in DRContext.filter_type.
 *   No code visible in this file reads the stored value.
 * - dnn_backend: 0 ("native") or 1 ("tensorflow"); stored in dnnctx.backend_type.
 *   The "tensorflow" named constant only exists when CONFIG_LIBTENSORFLOW == 1.
 *   NOTE(review): the numeric range stays 0..1 even when that constant is
 *   compiled out; presumably ff_dnn_init rejects an unavailable backend — confirm.
 * - model:  path to the model file (no default).
 * - input:  name of the model input, default "x".
 * - output: name of the model output, default "y".
 */
static const AVOption derain_options[] = {
    { "filter_type", "filter type(derain/dehaze)",  OFFSET(filter_type),    AV_OPT_TYPE_INT,    { .i64 = 0 },    0, 1, FLAGS, "type" },
    { "derain",      "derain filter flag",          0,                      AV_OPT_TYPE_CONST,  { .i64 = 0 },    0, 0, FLAGS, "type" },
    { "dehaze",      "dehaze filter flag",          0,                      AV_OPT_TYPE_CONST,  { .i64 = 1 },    0, 0, FLAGS, "type" },
    { "dnn_backend", "DNN backend",                 OFFSET(dnnctx.backend_type),   AV_OPT_TYPE_INT,    { .i64 = 0 },    0, 1, FLAGS, "backend" },
    { "native",      "native backend flag",         0,                      AV_OPT_TYPE_CONST,  { .i64 = 0 },    0, 0, FLAGS, "backend" },
#if (CONFIG_LIBTENSORFLOW == 1)
    { "tensorflow",  "tensorflow backend flag",     0,                      AV_OPT_TYPE_CONST,  { .i64 = 1 },    0, 0, FLAGS, "backend" },
#endif
    { "model",       "path to model file",          OFFSET(dnnctx.model_filename),   AV_OPT_TYPE_STRING,    { .str = NULL }, 0, 0, FLAGS },
    { "input",       "input name of the model",     OFFSET(dnnctx.model_inputname),  AV_OPT_TYPE_STRING,    { .str = "x" },  0, 0, FLAGS },
    { "output",      "output name of the model",    OFFSET(dnnctx.model_outputname), AV_OPT_TYPE_STRING,    { .str = "y" },  0, 0, FLAGS },
    { NULL }
};

/* Defines derain_class, which ff_vf_derain references as its priv_class. */
AVFILTER_DEFINE_CLASS(derain);

/**
 * Declare the pixel formats this filter works with.
 *
 * The list contains AV_PIX_FMT_RGB24 only and is terminated by
 * AV_PIX_FMT_NONE.
 *
 * @param ctx filter context the format list is applied to
 * @return the result of ff_set_common_formats()
 */
static int query_formats(AVFilterContext *ctx)
{
    const enum AVPixelFormat supported[] = {
        AV_PIX_FMT_RGB24,
        AV_PIX_FMT_NONE
    };
    AVFilterFormats *list = ff_make_format_list(supported);

    return ff_set_common_formats(ctx, list);
}

/**
 * Run one input frame through the DNN model and forward the result.
 *
 * An output buffer with the output link's dimensions is allocated, the
 * frame properties of @p in are copied onto it, and the model is executed
 * with @p in as input and the new buffer as output.
 *
 * @p in is freed on every path.  The output frame is handed to
 * ff_filter_frame() on success and freed on every failure path, so a
 * failing model execution no longer leaks it.
 *
 * @param inlink link the frame arrived on
 * @param in     input frame
 * @return the result of ff_filter_frame() on success;
 *         AVERROR(ENOMEM) if the output buffer cannot be allocated;
 *         the negative error from av_frame_copy_props() if it fails;
 *         AVERROR(EIO) if the model execution does not return DNN_SUCCESS
 */
static int filter_frame(AVFilterLink *inlink, AVFrame *in)
{
    AVFilterContext *ctx  = inlink->dst;
    AVFilterLink *outlink = ctx->outputs[0];
    DRContext *dr_context = ctx->priv;
    AVFrame *out;
    int ret;

    out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
    if (!out) {
        av_log(ctx, AV_LOG_ERROR, "could not allocate memory for output frame\n");
        ret = AVERROR(ENOMEM);
        goto fail;
    }

    ret = av_frame_copy_props(out, in);
    if (ret < 0) {
        goto fail;
    }

    if (ff_dnn_execute_model(&dr_context->dnnctx, in, out) != DNN_SUCCESS) {
        av_log(ctx, AV_LOG_ERROR, "failed to execute model\n");
        ret = AVERROR(EIO);
        goto fail;
    }

    av_frame_free(&in);

    return ff_filter_frame(outlink, out);

fail:
    /* av_frame_free() accepts a pointer to NULL, so this also covers the
     * path where the output buffer was never allocated. */
    av_frame_free(&in);
    av_frame_free(&out);
    return ret;
}

/**
 * Filter init callback: set up the DNN context stored in the private data.
 *
 * @param ctx filter context whose priv member is a DRContext
 * @return the result of ff_dnn_init() called with DFT_PROCESS_FRAME
 */
static av_cold int init(AVFilterContext *ctx)
{
    DRContext *priv = ctx->priv;
    DnnContext *dnn = &priv->dnnctx;

    return ff_dnn_init(dnn, DFT_PROCESS_FRAME, ctx);
}

/**
 * Filter uninit callback: hand the DNN context stored in the private
 * data to ff_dnn_uninit().
 *
 * @param ctx filter context whose priv member is a DRContext
 */
static av_cold void uninit(AVFilterContext *ctx)
{
    DRContext *priv = ctx->priv;
    DnnContext *dnn = &priv->dnnctx;

    ff_dnn_uninit(dnn);
}

/* Input pads: one video pad whose frames are processed by filter_frame(). */
static const AVFilterPad derain_inputs[] = {
    {
        .filter_frame = filter_frame,
        .type = AVMEDIA_TYPE_VIDEO,
        .name = "default",
    },
    { NULL } /* list terminator */
};

/* Output pads: one video pad with no callbacks of its own. */
static const AVFilterPad derain_outputs[] = {
    {
        .type = AVMEDIA_TYPE_VIDEO,
        .name = "default",
    },
    { NULL } /* list terminator */
};

/*
 * Filter definition for "derain": wires the callbacks, pads, option class
 * and private context size declared in this file together.
 */
AVFilter ff_vf_derain = {
    .name = "derain",
    .description = NULL_IF_CONFIG_SMALL("Apply derain filter to the input."),
    /* private data and its option class */
    .priv_size = sizeof(DRContext),
    .priv_class = &derain_class,
    /* lifecycle and format negotiation callbacks */
    .init = init,
    .uninit = uninit,
    .query_formats = query_formats,
    /* pads */
    .inputs = derain_inputs,
    .outputs = derain_outputs,
    .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
};
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`/*`
			`* Copyright (c) 2019 Xuewei Meng`
			`*`
			`* This file is part of FFmpeg.`
			`*`
			`* FFmpeg is free software; you can redistribute it and/or`
			`* modify it under the terms of the GNU Lesser General Public`
			`* License as published by the Free Software Foundation; either`
			`* version 2.1 of the License, or (at your option) any later version.`
			`*`
			`* FFmpeg is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`* Lesser General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU Lesser General Public`
			`* License along with FFmpeg; if not, write to the Free Software`
			`* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA`
			`*/`

			`/**`
			`* @file`
			`* Filter implementing image derain filter using deep convolutional networks.`
			`* http://openaccess.thecvf.com/content_ECCV_2018/html/Xia_Li_Recurrent_Squeeze-and-Excitation_Context_ECCV_2018_paper.html`
			`*/`

			`#include "libavformat/avio.h"`
			`#include "libavutil/opt.h"`
			`#include "avfilter.h"`
dnn: extract common functions used by different filters Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-26 07:35:30 +02:00			`#include "dnn_filter_common.h"`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`#include "formats.h"`
			`#include "internal.h"`

			`typedef struct DRContext {`
			`const AVClass *class;`
dnn: extract common functions used by different filters Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-26 07:35:30 +02:00			`DnnContext dnnctx;`
libavfilter: Add dehaze-filter option in existing derain. Add the support of dehaze filter in existing derain filter source code. As the processing procedure in FFmpeg is the same for current derain and dehaze, we reuse the derain filter source code. The model training and generation scripts are in repo https://github.com/XueweiMeng/derain_filter.git Reviewed-by: Steven Liu <lq@onvideo.cn> Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-08-22 12:28:44 +02:00			`int filter_type;`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`} DRContext;`

			`#define OFFSET(x) offsetof(DRContext, x)`
			`#define FLAGS AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM`
			`static const AVOption derain_options[] = {`
libavfilter: Add dehaze-filter option in existing derain. Add the support of dehaze filter in existing derain filter source code. As the processing procedure in FFmpeg is the same for current derain and dehaze, we reuse the derain filter source code. The model training and generation scripts are in repo https://github.com/XueweiMeng/derain_filter.git Reviewed-by: Steven Liu <lq@onvideo.cn> Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-08-22 12:28:44 +02:00			`{ "filter_type", "filter type(derain/dehaze)", OFFSET(filter_type), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, FLAGS, "type" },`
			`{ "derain", "derain filter flag", 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, 0, 0, FLAGS, "type" },`
			`{ "dehaze", "dehaze filter flag", 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, 0, 0, FLAGS, "type" },`
dnn: extract common functions used by different filters Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-26 07:35:30 +02:00			`{ "dnn_backend", "DNN backend", OFFSET(dnnctx.backend_type), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, FLAGS, "backend" },`
avfilter/vf_derain: reindent code after last commit Signed-off-by: Steven Liu <lq@chinaffmpeg.org> 2019-08-26 09:09:46 +02:00			`{ "native", "native backend flag", 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, 0, 0, FLAGS, "backend" },`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`#if (CONFIG_LIBTENSORFLOW == 1)`
avfilter/vf_derain: reindent code after last commit Signed-off-by: Steven Liu <lq@chinaffmpeg.org> 2019-08-26 09:09:46 +02:00			`{ "tensorflow", "tensorflow backend flag", 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, 0, 0, FLAGS, "backend" },`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`#endif`
dnn: extract common functions used by different filters Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-26 07:35:30 +02:00			`{ "model", "path to model file", OFFSET(dnnctx.model_filename), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, FLAGS },`
			`{ "input", "input name of the model", OFFSET(dnnctx.model_inputname), AV_OPT_TYPE_STRING, { .str = "x" }, 0, 0, FLAGS },`
			`{ "output", "output name of the model", OFFSET(dnnctx.model_outputname), AV_OPT_TYPE_STRING, { .str = "y" }, 0, 0, FLAGS },`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`{ NULL }`
			`};`

			`AVFILTER_DEFINE_CLASS(derain);`

			`static int query_formats(AVFilterContext *ctx)`
			`{`
			`AVFilterFormats *formats;`
			`const enum AVPixelFormat pixel_fmts[] = {`
			`AV_PIX_FMT_RGB24,`
			`AV_PIX_FMT_NONE`
			`};`

			`formats = ff_make_format_list(pixel_fmts);`

			`return ff_set_common_formats(ctx, formats);`
			`}`

			`static int filter_frame(AVFilterLink *inlink, AVFrame *in)`
			`{`
			`AVFilterContext *ctx = inlink->dst;`
			`AVFilterLink *outlink = ctx->outputs[0];`
			`DRContext *dr_context = ctx->priv;`
			`DNNReturnType dnn_result;`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 06:51:44 +02:00			`AVFrame *out;`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 06:51:44 +02:00			`out = ff_get_video_buffer(outlink, outlink->w, outlink->h);`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`if (!out) {`
			`av_log(ctx, AV_LOG_ERROR, "could not allocate memory for output frame\n");`
			`av_frame_free(&in);`
			`return AVERROR(ENOMEM);`
			`}`
			`av_frame_copy_props(out, in);`

dnn: extract common functions used by different filters Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-26 07:35:30 +02:00			`dnn_result = ff_dnn_execute_model(&dr_context->dnnctx, in, out);`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`if (dnn_result != DNN_SUCCESS){`
			`av_log(ctx, AV_LOG_ERROR, "failed to execute model\n");`
dnn: change dnn interface to replace DNNData* with AVFrame* Currently, every filter needs to provide code to transfer data from AVFrame* to model input (DNNData), and also from model output (DNNData) to AVFrame. Actually, such transfer can be implemented within DNN module, and so filter can focus on its own business logic. DNN module also exports the function pointer pre_proc and post_proc in struct DNNModel, just in case that a filter has its special logic to transfer data between AVFrame and DNNData*. The default implementation within DNN module is used if the filter does not set pre/post_proc. 2020-08-28 06:51:44 +02:00			`av_frame_free(&in);`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`return AVERROR(EIO);`
			`}`

			`av_frame_free(&in);`

			`return ff_filter_frame(outlink, out);`
			`}`

			`static av_cold int init(AVFilterContext *ctx)`
			`{`
			`DRContext *dr_context = ctx->priv;`
dnn: add function type for model So the backend knows the usage of model is for frame processing, detect, classify, etc. Each function type has different behavior in backend when handling the input/output data of the model. Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-02-07 08:35:22 +02:00			`return ff_dnn_init(&dr_context->dnnctx, DFT_PROCESS_FRAME, ctx);`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`}`

			`static av_cold void uninit(AVFilterContext *ctx)`
			`{`
			`DRContext *dr_context = ctx->priv;`
dnn: extract common functions used by different filters Signed-off-by: Guo, Yejun <yejun.guo@intel.com> 2021-01-26 07:35:30 +02:00			`ff_dnn_uninit(&dr_context->dnnctx);`
libavfilter: Add derain filter Remove the rain in the input image/video by applying the derain methods based on convolutional neural networks. Training scripts as well as scripts for model generation are provided in the repository at https://github.com/XueweiMeng/derain_filter.git. Signed-off-by: Xuewei Meng <xwmeng96@gmail.com> 2019-05-30 14:35:17 +02:00			`}`

			`static const AVFilterPad derain_inputs[] = {`
			`{`
			`.name = "default",`
			`.type = AVMEDIA_TYPE_VIDEO,`
			`.filter_frame = filter_frame,`
			`},`
			`{ NULL }`
			`};`

			`static const AVFilterPad derain_outputs[] = {`
			`{`
			`.name = "default",`
			`.type = AVMEDIA_TYPE_VIDEO,`
			`},`
			`{ NULL }`
			`};`

			`AVFilter ff_vf_derain = {`
			`.name = "derain",`
			`.description = NULL_IF_CONFIG_SMALL("Apply derain filter to the input."),`
			`.priv_size = sizeof(DRContext),`
			`.init = init,`
			`.uninit = uninit,`
			`.query_formats = query_formats,`
			`.inputs = derain_inputs,`
			`.outputs = derain_outputs,`
			`.priv_class = &derain_class,`
			`.flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,`
			`};`