mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-13 21:28:01 +02:00
dnn: add function type for model
So the backend knows the usage of model is for frame processing, detect, classify, etc. Each function type has different behavior in backend when handling the input/output data of the model. Signed-off-by: Guo, Yejun <yejun.guo@intel.com>
This commit is contained in:
parent
bdce636100
commit
76fc6879e2
@ -112,7 +112,7 @@ static DNNReturnType get_output_native(void *model, const char *input_name, int
|
|||||||
// layers_num,layer_type,layer_parameterss,layer_type,layer_parameters...
|
// layers_num,layer_type,layer_parameterss,layer_type,layer_parameters...
|
||||||
// For CONV layer: activation_function, input_num, output_num, kernel_size, kernel, biases
|
// For CONV layer: activation_function, input_num, output_num, kernel_size, kernel, biases
|
||||||
// For DEPTH_TO_SPACE layer: block_size
|
// For DEPTH_TO_SPACE layer: block_size
|
||||||
DNNModel *ff_dnn_load_model_native(const char *model_filename, const char *options, AVFilterContext *filter_ctx)
|
DNNModel *ff_dnn_load_model_native(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx)
|
||||||
{
|
{
|
||||||
DNNModel *model = NULL;
|
DNNModel *model = NULL;
|
||||||
char header_expected[] = "FFMPEGDNNNATIVE";
|
char header_expected[] = "FFMPEGDNNNATIVE";
|
||||||
@ -256,6 +256,7 @@ DNNModel *ff_dnn_load_model_native(const char *model_filename, const char *optio
|
|||||||
model->get_input = &get_input_native;
|
model->get_input = &get_input_native;
|
||||||
model->get_output = &get_output_native;
|
model->get_output = &get_output_native;
|
||||||
model->filter_ctx = filter_ctx;
|
model->filter_ctx = filter_ctx;
|
||||||
|
model->func_type = func_type;
|
||||||
|
|
||||||
return model;
|
return model;
|
||||||
|
|
||||||
|
@ -128,7 +128,7 @@ typedef struct NativeModel{
|
|||||||
int32_t operands_num;
|
int32_t operands_num;
|
||||||
} NativeModel;
|
} NativeModel;
|
||||||
|
|
||||||
DNNModel *ff_dnn_load_model_native(const char *model_filename, const char *options, AVFilterContext *filter_ctx);
|
DNNModel *ff_dnn_load_model_native(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx);
|
||||||
|
|
||||||
DNNReturnType ff_dnn_execute_model_native(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
DNNReturnType ff_dnn_execute_model_native(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
||||||
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
||||||
|
@ -524,7 +524,7 @@ static DNNReturnType get_output_ov(void *model, const char *input_name, int inpu
|
|||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
DNNModel *ff_dnn_load_model_ov(const char *model_filename, const char *options, AVFilterContext *filter_ctx)
|
DNNModel *ff_dnn_load_model_ov(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx)
|
||||||
{
|
{
|
||||||
DNNModel *model = NULL;
|
DNNModel *model = NULL;
|
||||||
OVModel *ov_model = NULL;
|
OVModel *ov_model = NULL;
|
||||||
@ -572,6 +572,7 @@ DNNModel *ff_dnn_load_model_ov(const char *model_filename, const char *options,
|
|||||||
model->get_output = &get_output_ov;
|
model->get_output = &get_output_ov;
|
||||||
model->options = options;
|
model->options = options;
|
||||||
model->filter_ctx = filter_ctx;
|
model->filter_ctx = filter_ctx;
|
||||||
|
model->func_type = func_type;
|
||||||
|
|
||||||
return model;
|
return model;
|
||||||
|
|
||||||
|
@ -29,7 +29,7 @@
|
|||||||
|
|
||||||
#include "../dnn_interface.h"
|
#include "../dnn_interface.h"
|
||||||
|
|
||||||
DNNModel *ff_dnn_load_model_ov(const char *model_filename, const char *options, AVFilterContext *filter_ctx);
|
DNNModel *ff_dnn_load_model_ov(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx);
|
||||||
|
|
||||||
DNNReturnType ff_dnn_execute_model_ov(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
DNNReturnType ff_dnn_execute_model_ov(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
||||||
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
||||||
|
@ -580,7 +580,7 @@ static DNNReturnType load_native_model(TFModel *tf_model, const char *model_file
|
|||||||
DNNModel *model = NULL;
|
DNNModel *model = NULL;
|
||||||
NativeModel *native_model;
|
NativeModel *native_model;
|
||||||
|
|
||||||
model = ff_dnn_load_model_native(model_filename, NULL, NULL);
|
model = ff_dnn_load_model_native(model_filename, DFT_PROCESS_FRAME, NULL, NULL);
|
||||||
if (!model){
|
if (!model){
|
||||||
av_log(ctx, AV_LOG_ERROR, "Failed to load native model\n");
|
av_log(ctx, AV_LOG_ERROR, "Failed to load native model\n");
|
||||||
return DNN_ERROR;
|
return DNN_ERROR;
|
||||||
@ -664,7 +664,7 @@ static DNNReturnType load_native_model(TFModel *tf_model, const char *model_file
|
|||||||
return DNN_SUCCESS;
|
return DNN_SUCCESS;
|
||||||
}
|
}
|
||||||
|
|
||||||
DNNModel *ff_dnn_load_model_tf(const char *model_filename, const char *options, AVFilterContext *filter_ctx)
|
DNNModel *ff_dnn_load_model_tf(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx)
|
||||||
{
|
{
|
||||||
DNNModel *model = NULL;
|
DNNModel *model = NULL;
|
||||||
TFModel *tf_model = NULL;
|
TFModel *tf_model = NULL;
|
||||||
@ -705,6 +705,7 @@ DNNModel *ff_dnn_load_model_tf(const char *model_filename, const char *options,
|
|||||||
model->get_output = &get_output_tf;
|
model->get_output = &get_output_tf;
|
||||||
model->options = options;
|
model->options = options;
|
||||||
model->filter_ctx = filter_ctx;
|
model->filter_ctx = filter_ctx;
|
||||||
|
model->func_type = func_type;
|
||||||
|
|
||||||
return model;
|
return model;
|
||||||
}
|
}
|
||||||
|
@ -29,7 +29,7 @@
|
|||||||
|
|
||||||
#include "../dnn_interface.h"
|
#include "../dnn_interface.h"
|
||||||
|
|
||||||
DNNModel *ff_dnn_load_model_tf(const char *model_filename, const char *options, AVFilterContext *filter_ctx);
|
DNNModel *ff_dnn_load_model_tf(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx);
|
||||||
|
|
||||||
DNNReturnType ff_dnn_execute_model_tf(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
DNNReturnType ff_dnn_execute_model_tf(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
||||||
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
||||||
|
@ -18,7 +18,7 @@
|
|||||||
|
|
||||||
#include "dnn_filter_common.h"
|
#include "dnn_filter_common.h"
|
||||||
|
|
||||||
int ff_dnn_init(DnnContext *ctx, AVFilterContext *filter_ctx)
|
int ff_dnn_init(DnnContext *ctx, DNNFunctionType func_type, AVFilterContext *filter_ctx)
|
||||||
{
|
{
|
||||||
if (!ctx->model_filename) {
|
if (!ctx->model_filename) {
|
||||||
av_log(filter_ctx, AV_LOG_ERROR, "model file for network is not specified\n");
|
av_log(filter_ctx, AV_LOG_ERROR, "model file for network is not specified\n");
|
||||||
@ -43,7 +43,7 @@ int ff_dnn_init(DnnContext *ctx, AVFilterContext *filter_ctx)
|
|||||||
return AVERROR(EINVAL);
|
return AVERROR(EINVAL);
|
||||||
}
|
}
|
||||||
|
|
||||||
ctx->model = (ctx->dnn_module->load_model)(ctx->model_filename, ctx->backend_options, filter_ctx);
|
ctx->model = (ctx->dnn_module->load_model)(ctx->model_filename, func_type, ctx->backend_options, filter_ctx);
|
||||||
if (!ctx->model) {
|
if (!ctx->model) {
|
||||||
av_log(filter_ctx, AV_LOG_ERROR, "could not load DNN model\n");
|
av_log(filter_ctx, AV_LOG_ERROR, "could not load DNN model\n");
|
||||||
return AVERROR(EINVAL);
|
return AVERROR(EINVAL);
|
||||||
|
@ -47,7 +47,7 @@ typedef struct DnnContext {
|
|||||||
{ "async", "use DNN async inference", OFFSET(async), AV_OPT_TYPE_BOOL, { .i64 = 1}, 0, 1, FLAGS},
|
{ "async", "use DNN async inference", OFFSET(async), AV_OPT_TYPE_BOOL, { .i64 = 1}, 0, 1, FLAGS},
|
||||||
|
|
||||||
|
|
||||||
int ff_dnn_init(DnnContext *ctx, AVFilterContext *filter_ctx);
|
int ff_dnn_init(DnnContext *ctx, DNNFunctionType func_type, AVFilterContext *filter_ctx);
|
||||||
DNNReturnType ff_dnn_get_input(DnnContext *ctx, DNNData *input);
|
DNNReturnType ff_dnn_get_input(DnnContext *ctx, DNNData *input);
|
||||||
DNNReturnType ff_dnn_get_output(DnnContext *ctx, int input_width, int input_height, int *output_width, int *output_height);
|
DNNReturnType ff_dnn_get_output(DnnContext *ctx, int input_width, int input_height, int *output_width, int *output_height);
|
||||||
DNNReturnType ff_dnn_execute_model(DnnContext *ctx, AVFrame *in_frame, AVFrame *out_frame);
|
DNNReturnType ff_dnn_execute_model(DnnContext *ctx, AVFrame *in_frame, AVFrame *out_frame);
|
||||||
|
@ -43,6 +43,13 @@ typedef enum {
|
|||||||
DAST_SUCCESS // got a result frame successfully
|
DAST_SUCCESS // got a result frame successfully
|
||||||
} DNNAsyncStatusType;
|
} DNNAsyncStatusType;
|
||||||
|
|
||||||
|
typedef enum {
|
||||||
|
DFT_NONE,
|
||||||
|
DFT_PROCESS_FRAME, // process the whole frame
|
||||||
|
DFT_ANALYTICS_DETECT, // detect from the whole frame
|
||||||
|
// we can add more such as detect_from_crop, classify_from_bbox, etc.
|
||||||
|
}DNNFunctionType;
|
||||||
|
|
||||||
typedef struct DNNData{
|
typedef struct DNNData{
|
||||||
void *data;
|
void *data;
|
||||||
DNNDataType dt;
|
DNNDataType dt;
|
||||||
@ -56,6 +63,8 @@ typedef struct DNNModel{
|
|||||||
const char *options;
|
const char *options;
|
||||||
// Stores FilterContext used for the interaction between AVFrame and DNNData
|
// Stores FilterContext used for the interaction between AVFrame and DNNData
|
||||||
AVFilterContext *filter_ctx;
|
AVFilterContext *filter_ctx;
|
||||||
|
// Stores function type of the model
|
||||||
|
DNNFunctionType func_type;
|
||||||
// Gets model input information
|
// Gets model input information
|
||||||
// Just reuse struct DNNData here, actually the DNNData.data field is not needed.
|
// Just reuse struct DNNData here, actually the DNNData.data field is not needed.
|
||||||
DNNReturnType (*get_input)(void *model, DNNData *input, const char *input_name);
|
DNNReturnType (*get_input)(void *model, DNNData *input, const char *input_name);
|
||||||
@ -73,7 +82,7 @@ typedef struct DNNModel{
|
|||||||
// Stores pointers to functions for loading, executing, freeing DNN models for one of the backends.
|
// Stores pointers to functions for loading, executing, freeing DNN models for one of the backends.
|
||||||
typedef struct DNNModule{
|
typedef struct DNNModule{
|
||||||
// Loads model and parameters from given file. Returns NULL if it is not possible.
|
// Loads model and parameters from given file. Returns NULL if it is not possible.
|
||||||
DNNModel *(*load_model)(const char *model_filename, const char *options, AVFilterContext *filter_ctx);
|
DNNModel *(*load_model)(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx);
|
||||||
// Executes model with specified input and output. Returns DNN_ERROR otherwise.
|
// Executes model with specified input and output. Returns DNN_ERROR otherwise.
|
||||||
DNNReturnType (*execute_model)(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
DNNReturnType (*execute_model)(const DNNModel *model, const char *input_name, AVFrame *in_frame,
|
||||||
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
const char **output_names, uint32_t nb_output, AVFrame *out_frame);
|
||||||
|
@ -100,7 +100,7 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
|
|||||||
static av_cold int init(AVFilterContext *ctx)
|
static av_cold int init(AVFilterContext *ctx)
|
||||||
{
|
{
|
||||||
DRContext *dr_context = ctx->priv;
|
DRContext *dr_context = ctx->priv;
|
||||||
return ff_dnn_init(&dr_context->dnnctx, ctx);
|
return ff_dnn_init(&dr_context->dnnctx, DFT_PROCESS_FRAME, ctx);
|
||||||
}
|
}
|
||||||
|
|
||||||
static av_cold void uninit(AVFilterContext *ctx)
|
static av_cold void uninit(AVFilterContext *ctx)
|
||||||
|
@ -62,7 +62,7 @@ AVFILTER_DEFINE_CLASS(dnn_processing);
|
|||||||
static av_cold int init(AVFilterContext *context)
|
static av_cold int init(AVFilterContext *context)
|
||||||
{
|
{
|
||||||
DnnProcessingContext *ctx = context->priv;
|
DnnProcessingContext *ctx = context->priv;
|
||||||
return ff_dnn_init(&ctx->dnnctx, context);
|
return ff_dnn_init(&ctx->dnnctx, DFT_PROCESS_FRAME, context);
|
||||||
}
|
}
|
||||||
|
|
||||||
static int query_formats(AVFilterContext *context)
|
static int query_formats(AVFilterContext *context)
|
||||||
|
@ -63,7 +63,7 @@ AVFILTER_DEFINE_CLASS(sr);
|
|||||||
static av_cold int init(AVFilterContext *context)
|
static av_cold int init(AVFilterContext *context)
|
||||||
{
|
{
|
||||||
SRContext *sr_context = context->priv;
|
SRContext *sr_context = context->priv;
|
||||||
return ff_dnn_init(&sr_context->dnnctx, context);
|
return ff_dnn_init(&sr_context->dnnctx, DFT_PROCESS_FRAME, context);
|
||||||
}
|
}
|
||||||
|
|
||||||
static int query_formats(AVFilterContext *context)
|
static int query_formats(AVFilterContext *context)
|
||||||
|
Loading…
Reference in New Issue
Block a user