You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

111 lines
4.6KB

  /*
   * Copyright (c) 2018 Sergey Lavrushkin
   *
   * This file is part of FFmpeg.
   *
   * FFmpeg is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
   * FFmpeg is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
   * License along with FFmpeg; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  /**
   * @file
   * DNN inference engine interface.
   */
  24. #ifndef AVFILTER_DNN_INTERFACE_H
  25. #define AVFILTER_DNN_INTERFACE_H
  26. #include <stdint.h>
  27. #include "libavutil/frame.h"
  28. #include "avfilter.h"
  /**
   * Result code used as the return type of the model and module callbacks
   * declared in this header.
   *
   * The enumerators carry no explicit values, so DNN_SUCCESS is 0 and
   * DNN_ERROR is 1.
   */
  typedef enum {
      DNN_SUCCESS,
      DNN_ERROR
  } DNNReturnType;
  /**
   * Selects the inference backend; passed to ff_get_dnn_module().
   */
  typedef enum {
      DNN_NATIVE, // presumably the built-in backend; confirm against the implementation
      DNN_TF,     // presumably TensorFlow; confirm against the implementation
      DNN_OV      // presumably OpenVINO; confirm against the implementation
  } DNNBackendType;
  /**
   * Element type tag stored in DNNData.dt.
   *
   * NOTE(review): the explicit values 1 and 4 are kept exactly as written;
   * they presumably mirror an external numbering -- confirm before changing.
   */
  typedef enum {
      DNN_FLOAT = 1,
      DNN_UINT8 = 4
  } DNNDataType;
  /**
   * Channel order tag stored in DNNData.order.
   */
  typedef enum {
      DCO_NONE,
      DCO_BGR,
  } DNNColorOrder;
  /**
   * Status reported by DNNModule.get_async_result().
   */
  typedef enum {
      DAST_FAIL,        // something went wrong
      DAST_EMPTY_QUEUE, // no more inference results to get
      DAST_NOT_READY,   // all queued inferences are not finished
      DAST_SUCCESS      // got a result frame successfully
  } DNNAsyncStatusType;
  /**
   * Kind of work a model performs; stored in DNNModel.func_type and passed
   * to DNNModule.load_model().
   */
  typedef enum {
      DFT_NONE,
      DFT_PROCESS_FRAME,    // process the whole frame
      DFT_ANALYTICS_DETECT, // detect from the whole frame
      // more can be added here, such as detect_from_crop, classify_from_bbox, etc.
  } DNNFunctionType;
  48. typedef struct DNNData{
  49. void *data;
  50. int width, height, channels;
  51. // dt and order together decide the color format
  52. DNNDataType dt;
  53. DNNColorOrder order;
  54. } DNNData;
  55. typedef struct DNNModel{
  56. // Stores model that can be different for different backends.
  57. void *model;
  58. // Stores options when the model is executed by the backend
  59. const char *options;
  60. // Stores FilterContext used for the interaction between AVFrame and DNNData
  61. AVFilterContext *filter_ctx;
  62. // Stores function type of the model
  63. DNNFunctionType func_type;
  64. // Gets model input information
  65. // Just reuse struct DNNData here, actually the DNNData.data field is not needed.
  66. DNNReturnType (*get_input)(void *model, DNNData *input, const char *input_name);
  67. // Gets model output width/height with given input w/h
  68. DNNReturnType (*get_output)(void *model, const char *input_name, int input_width, int input_height,
  69. const char *output_name, int *output_width, int *output_height);
  70. // set the pre process to transfer data from AVFrame to DNNData
  71. // the default implementation within DNN is used if it is not provided by the filter
  72. int (*pre_proc)(AVFrame *frame_in, DNNData *model_input, AVFilterContext *filter_ctx);
  73. // set the post process to transfer data from DNNData to AVFrame
  74. // the default implementation within DNN is used if it is not provided by the filter
  75. int (*post_proc)(AVFrame *frame_out, DNNData *model_output, AVFilterContext *filter_ctx);
  76. } DNNModel;
  77. // Stores pointers to functions for loading, executing, freeing DNN models for one of the backends.
  78. typedef struct DNNModule{
  79. // Loads model and parameters from given file. Returns NULL if it is not possible.
  80. DNNModel *(*load_model)(const char *model_filename, DNNFunctionType func_type, const char *options, AVFilterContext *filter_ctx);
  81. // Executes model with specified input and output. Returns DNN_ERROR otherwise.
  82. DNNReturnType (*execute_model)(const DNNModel *model, const char *input_name, AVFrame *in_frame,
  83. const char **output_names, uint32_t nb_output, AVFrame *out_frame);
  84. // Executes model with specified input and output asynchronously. Returns DNN_ERROR otherwise.
  85. DNNReturnType (*execute_model_async)(const DNNModel *model, const char *input_name, AVFrame *in_frame,
  86. const char **output_names, uint32_t nb_output, AVFrame *out_frame);
  87. // Retrieve inference result.
  88. DNNAsyncStatusType (*get_async_result)(const DNNModel *model, AVFrame **in, AVFrame **out);
  89. // Flush all the pending tasks.
  90. DNNReturnType (*flush)(const DNNModel *model);
  91. // Frees memory allocated for model.
  92. void (*free_model)(DNNModel **model);
  93. } DNNModule;
  94. // Initializes DNNModule depending on chosen backend.
  95. DNNModule *ff_get_dnn_module(DNNBackendType backend_type);
  96. #endif