avfilter/dnn: unify the layer execution function in native mode
author    Guo, Yejun <yejun.guo@intel.com>
          Wed, 9 Oct 2019 14:08:11 +0000 (22:08 +0800)
committer Pedro Arthur <bygrandao@gmail.com>
          Tue, 15 Oct 2019 21:56:25 +0000 (18:56 -0300)
Signed-off-by: Guo, Yejun <yejun.guo@intel.com>
Signed-off-by: Pedro Arthur <bygrandao@gmail.com>
15 files changed:
libavfilter/dnn/Makefile
libavfilter/dnn/dnn_backend_native.c
libavfilter/dnn/dnn_backend_native.h
libavfilter/dnn/dnn_backend_native_layer_conv2d.c
libavfilter/dnn/dnn_backend_native_layer_conv2d.h
libavfilter/dnn/dnn_backend_native_layer_depth2space.c
libavfilter/dnn/dnn_backend_native_layer_depth2space.h
libavfilter/dnn/dnn_backend_native_layer_maximum.c
libavfilter/dnn/dnn_backend_native_layer_maximum.h
libavfilter/dnn/dnn_backend_native_layer_pad.c
libavfilter/dnn/dnn_backend_native_layer_pad.h
libavfilter/dnn/dnn_backend_native_layers.c [new file with mode: 0644]
libavfilter/dnn/dnn_backend_native_layers.h [new file with mode: 0644]
tests/dnn/dnn-layer-conv2d-test.c
tests/dnn/dnn-layer-depth2space-test.c
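
Editorial summary: the change below replaces the per-layer-type switch in ff_dnn_execute_model_native() with a function-pointer table (layer_funcs[]) indexed by DNNLayerType, so every native layer runs through one unified signature that receives its parameters as a const void *. The minimal, self-contained sketch below illustrates only the pattern; every demo_* name is invented for this note and none of this code is part of the commit.

#include <stdio.h>

typedef enum { DEMO_INPUT = 0, DEMO_CONV2D = 1, DEMO_COUNT } DemoLayerType;

/* unified signature: every layer takes its parameters as const void * */
typedef int (*DemoLayerFunc)(const void *parameters);

static int demo_exec_conv2d(const void *parameters)
{
    const int *kernel_size = parameters;   /* each layer casts back to its own params */
    printf("conv2d, kernel_size=%d\n", *kernel_size);
    return 0;
}

static const DemoLayerFunc demo_layer_funcs[DEMO_COUNT] = {
    NULL,              /* the input "layer" has no execution function */
    demo_exec_conv2d,  /* index equals the enum value, as in layer_funcs[] */
};

int main(void)
{
    int kernel_size = 3;
    DemoLayerType type = DEMO_CONV2D;
    /* one call site replaces the per-type switch statement */
    return demo_layer_funcs[type](&kernel_size);
}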

diff --git a/libavfilter/dnn/Makefile b/libavfilter/dnn/Makefile
index 721094ddc83c194260a48bab34eb55c12726bcfb..171f00e502d6391111d4e3fc95fb31f98b3c4ab6 100644
@@ -1,5 +1,6 @@
 OBJS-$(CONFIG_DNN)                           += dnn/dnn_interface.o
 OBJS-$(CONFIG_DNN)                           += dnn/dnn_backend_native.o
+OBJS-$(CONFIG_DNN)                           += dnn/dnn_backend_native_layers.o
 OBJS-$(CONFIG_DNN)                           += dnn/dnn_backend_native_layer_pad.o
 OBJS-$(CONFIG_DNN)                           += dnn/dnn_backend_native_layer_conv2d.o
 OBJS-$(CONFIG_DNN)                           += dnn/dnn_backend_native_layer_depth2space.o
diff --git a/libavfilter/dnn/dnn_backend_native.c b/libavfilter/dnn/dnn_backend_native.c
index 97549d3077c910af437b3550caefd1dcb2bfc9b7..c8fb956dec8c1392ab469ff9b4930e3c5dd76673 100644
@@ -29,6 +29,7 @@
 #include "dnn_backend_native_layer_conv2d.h"
 #include "dnn_backend_native_layer_depth2space.h"
 #include "dnn_backend_native_layer_maximum.h"
+#include "dnn_backend_native_layers.h"
 
 static DNNReturnType set_input_output_native(void *model, DNNInputData *input, const char *input_name, const char **output_names, uint32_t nb_output)
 {
@@ -331,10 +332,6 @@ DNNReturnType ff_dnn_execute_model_native(const DNNModel *model, DNNData *output
 {
     ConvolutionalNetwork *network = (ConvolutionalNetwork *)model->model;
     int32_t layer;
-    ConvolutionalParams *conv_params;
-    DepthToSpaceParams *depth_to_space_params;
-    LayerPadParams *pad_params;
-    DnnLayerMaximumParams *maximum_params;
     uint32_t nb = FFMIN(nb_output, network->nb_output);
 
     if (network->layers_num <= 0 || network->operands_num <= 0)
@@ -343,30 +340,11 @@ DNNReturnType ff_dnn_execute_model_native(const DNNModel *model, DNNData *output
         return DNN_ERROR;
 
     for (layer = 0; layer < network->layers_num; ++layer){
-        switch (network->layers[layer].type){
-        case DLT_CONV2D:
-            conv_params = (ConvolutionalParams *)network->layers[layer].params;
-            convolve(network->operands, network->layers[layer].input_operand_indexes,
-                     network->layers[layer].output_operand_index, conv_params);
-            break;
-        case DLT_DEPTH_TO_SPACE:
-            depth_to_space_params = (DepthToSpaceParams *)network->layers[layer].params;
-            depth_to_space(network->operands, network->layers[layer].input_operand_indexes,
-                           network->layers[layer].output_operand_index, depth_to_space_params->block_size);
-            break;
-        case DLT_MIRROR_PAD:
-            pad_params = (LayerPadParams *)network->layers[layer].params;
-            dnn_execute_layer_pad(network->operands, network->layers[layer].input_operand_indexes,
-                                  network->layers[layer].output_operand_index, pad_params);
-            break;
-        case DLT_MAXIMUM:
-            maximum_params = (DnnLayerMaximumParams *)network->layers[layer].params;
-            dnn_execute_layer_maximum(network->operands, network->layers[layer].input_operand_indexes,
-                                  network->layers[layer].output_operand_index, maximum_params);
-            break;
-        case DLT_INPUT:
-            return DNN_ERROR;
-        }
+        DNNLayerType layer_type = network->layers[layer].type;
+        layer_funcs[layer_type](network->operands,
+                                  network->layers[layer].input_operand_indexes,
+                                  network->layers[layer].output_operand_index,
+                                  network->layers[layer].params);
     }
 
     for (uint32_t i = 0; i < nb; ++i) {
diff --git a/libavfilter/dnn/dnn_backend_native.h b/libavfilter/dnn/dnn_backend_native.h
index 761e5ed02ca1d3c5e7fb552130b6050391a3ae4b..98213901947618c28b3c50b265c035dee58dd4ee 100644
 /**
  * the enum value of DNNLayerType should not be changed,
  * the same values are used in convert_from_tensorflow.py
+ * and, it is used to index the layer execution function pointer.
  */
 typedef enum {
     DLT_INPUT = 0,
     DLT_CONV2D = 1,
     DLT_DEPTH_TO_SPACE = 2,
     DLT_MIRROR_PAD = 3,
-    DLT_MAXIMUM = 4
+    DLT_MAXIMUM = 4,
+    DLT_COUNT
 } DNNLayerType;
 
 typedef enum {DOT_INPUT = 1, DOT_OUTPUT = 2, DOT_INTERMEDIATE = DOT_INPUT | DOT_INPUT} DNNOperandType;
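
Editorial note on the new DLT_COUNT entry: as the comment above says, the enum value now does double duty as the index into the layer execution table, and the same numeric values are written by convert_from_tensorflow.py into the model file that the native backend loads back. As a hedged sketch that is not part of this commit, a caller could use DLT_COUNT to bounds-check a type before dispatching; demo_execute_one_layer() is an invented name, while the field accesses mirror those in ff_dnn_execute_model_native() above.

#include <stdint.h>
#include "dnn_backend_native.h"
#include "dnn_backend_native_layers.h"

static int demo_execute_one_layer(ConvolutionalNetwork *network, int32_t layer)
{
    DNNLayerType layer_type = network->layers[layer].type;

    /* DLT_INPUT maps to a NULL table entry, and the value itself comes from
       the model file, so reject anything that cannot be dispatched */
    if (layer_type >= DLT_COUNT || !layer_funcs[layer_type])
        return 1;

    return layer_funcs[layer_type](network->operands,
                                   network->layers[layer].input_operand_indexes,
                                   network->layers[layer].output_operand_index,
                                   network->layers[layer].params);
}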
diff --git a/libavfilter/dnn/dnn_backend_native_layer_conv2d.c b/libavfilter/dnn/dnn_backend_native_layer_conv2d.c
index b13b4314ec49c9b991d4d47330dbaaed70dbac79..594187f5b13a696dac43cb764b67191af5767618 100644
@@ -23,7 +23,8 @@
 
 #define CLAMP_TO_EDGE(x, w) ((x) < 0 ? 0 : ((x) >= (w) ? (w - 1) : (x)))
 
-int convolve(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index, const ConvolutionalParams *conv_params)
+int dnn_execute_layer_conv2d(DnnOperand *operands, const int32_t *input_operand_indexes,
+                             int32_t output_operand_index, const void *parameters)
 {
     float *output;
     int32_t input_operand_index = input_operand_indexes[0];
@@ -32,6 +33,7 @@ int convolve(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t
     int width = operands[input_operand_index].dims[2];
     int channel = operands[input_operand_index].dims[3];
     const float *input = operands[input_operand_index].data;
+    const ConvolutionalParams *conv_params = (const ConvolutionalParams *)parameters;
 
     int radius = conv_params->kernel_size >> 1;
     int src_linesize = width * conv_params->input_num;
diff --git a/libavfilter/dnn/dnn_backend_native_layer_conv2d.h b/libavfilter/dnn/dnn_backend_native_layer_conv2d.h
index 7ddfff38baeb372c81bd23b0bbd8f430d74769f5..1dd84cb8f6db94081ae870e968b03d0375f4c33b 100644
@@ -35,5 +35,6 @@ typedef struct ConvolutionalParams{
     float *biases;
 } ConvolutionalParams;
 
-int convolve(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index, const ConvolutionalParams *conv_params);
+int dnn_execute_layer_conv2d(DnnOperand *operands, const int32_t *input_operand_indexes,
+                             int32_t output_operand_index, const void *parameters);
 #endif
diff --git a/libavfilter/dnn/dnn_backend_native_layer_depth2space.c b/libavfilter/dnn/dnn_backend_native_layer_depth2space.c
index a248764681a5078a0cc1e45ab92cf8424075475b..37200607b25c59a76a3959c57588f9d9c60d15d2 100644
 #include "libavutil/avassert.h"
 #include "dnn_backend_native_layer_depth2space.h"
 
-int depth_to_space(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index, int block_size)
+int dnn_execute_layer_depth2space(DnnOperand *operands, const int32_t *input_operand_indexes,
+                                  int32_t output_operand_index, const void *parameters)
 {
     float *output;
+    const DepthToSpaceParams *params = (const DepthToSpaceParams *)parameters;
+    int block_size = params->block_size;
     int32_t input_operand_index = input_operand_indexes[0];
     int number = operands[input_operand_index].dims[0];
     int height = operands[input_operand_index].dims[1];
diff --git a/libavfilter/dnn/dnn_backend_native_layer_depth2space.h b/libavfilter/dnn/dnn_backend_native_layer_depth2space.h
index 8708be83b9b52ae92efef61e127996ab1d89ca0b..c481bf1e5c6e8dea00574c954ba9cfdff1e135f4 100644
@@ -34,6 +34,7 @@ typedef struct DepthToSpaceParams{
     int block_size;
 } DepthToSpaceParams;
 
-int depth_to_space(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index, int block_size);
+int dnn_execute_layer_depth2space(DnnOperand *operands, const int32_t *input_operand_indexes,
+                                  int32_t output_operand_index, const void *parameters);
 
 #endif
diff --git a/libavfilter/dnn/dnn_backend_native_layer_maximum.c b/libavfilter/dnn/dnn_backend_native_layer_maximum.c
index a2669af794914b5b91ae57966300f3251d0f34e6..6add170319c8d2312837ecace43a7d00674126da 100644
 #include "libavutil/avassert.h"
 #include "dnn_backend_native_layer_maximum.h"
 
-int dnn_execute_layer_maximum(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index, const DnnLayerMaximumParams *params)
+int dnn_execute_layer_maximum(DnnOperand *operands, const int32_t *input_operand_indexes,
+                              int32_t output_operand_index, const void *parameters)
 {
     const DnnOperand *input = &operands[input_operand_indexes[0]];
     DnnOperand *output = &operands[output_operand_index];
+    const DnnLayerMaximumParams *params = (const DnnLayerMaximumParams *)parameters;
     int dims_count;
     const float *src;
     float *dst;
diff --git a/libavfilter/dnn/dnn_backend_native_layer_maximum.h b/libavfilter/dnn/dnn_backend_native_layer_maximum.h
index 6396e5818c2a16d6a2e1ccf1b4374888c8a558b6..87f3bf5a800fb835ec872e6f26386010534c6061 100644
@@ -37,6 +37,7 @@ typedef struct DnnLayerMaximumParams{
     }val;
 } DnnLayerMaximumParams;
 
-int dnn_execute_layer_maximum(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index, const DnnLayerMaximumParams *params);
+int dnn_execute_layer_maximum(DnnOperand *operands, const int32_t *input_operand_indexes,
+                              int32_t output_operand_index, const void *parameters);
 
 #endif
diff --git a/libavfilter/dnn/dnn_backend_native_layer_pad.c b/libavfilter/dnn/dnn_backend_native_layer_pad.c
index c2905a75ea4d36bd11a25357b0dfc188a0ce49c2..f5c572728fd81c06277759d525fbb1d4972cb70a 100644
@@ -48,12 +48,13 @@ static int after_get_buddy(int given, int border, LayerPadModeParam mode)
     }
 }
 
-int dnn_execute_layer_pad(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index,
-                           const LayerPadParams *params)
+int dnn_execute_layer_pad(DnnOperand *operands, const int32_t *input_operand_indexes,
+                          int32_t output_operand_index, const void *parameters)
 {
     int32_t before_paddings;
     int32_t after_paddings;
     float* output;
+    const LayerPadParams *params = (const LayerPadParams *)parameters;
 
     // suppose format is <N, H, W, C>
     int32_t input_operand_index = input_operand_indexes[0];
diff --git a/libavfilter/dnn/dnn_backend_native_layer_pad.h b/libavfilter/dnn/dnn_backend_native_layer_pad.h
index 7cc821352182d0a77e3b495545e1a4fcacfba237..036ff7b86f5a47e8c092acc1ea9bc81fe831b7a4 100644
@@ -36,7 +36,7 @@ typedef struct LayerPadParams{
     float constant_values;
 } LayerPadParams;
 
-int dnn_execute_layer_pad(DnnOperand *operands, const int32_t *input_operand_indexes, int32_t output_operand_index,
-                           const LayerPadParams *params);
+int dnn_execute_layer_pad(DnnOperand *operands, const int32_t *input_operand_indexes,
+                          int32_t output_operand_index, const void *parameters);
 
 #endif
diff --git a/libavfilter/dnn/dnn_backend_native_layers.c b/libavfilter/dnn/dnn_backend_native_layers.c
new file mode 100644
index 0000000..17b91bb
--- /dev/null
+++ b/libavfilter/dnn/dnn_backend_native_layers.c
@@ -0,0 +1,34 @@
+/*
+ * Copyright (c) 2019 Guo Yejun
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include <string.h>
+#include "dnn_backend_native_layers.h"
+#include "dnn_backend_native_layer_pad.h"
+#include "dnn_backend_native_layer_conv2d.h"
+#include "dnn_backend_native_layer_depth2space.h"
+#include "dnn_backend_native_layer_maximum.h"
+
+LAYER_EXEC_FUNC layer_funcs[DLT_COUNT] = {
+    NULL,
+    dnn_execute_layer_conv2d,
+    dnn_execute_layer_depth2space,
+    dnn_execute_layer_pad,
+    dnn_execute_layer_maximum,
+};
diff --git a/libavfilter/dnn/dnn_backend_native_layers.h b/libavfilter/dnn/dnn_backend_native_layers.h
new file mode 100644
index 0000000..3276aee
--- /dev/null
+++ b/libavfilter/dnn/dnn_backend_native_layers.h
@@ -0,0 +1,32 @@
+/*
+ * Copyright (c) 2019 Guo Yejun
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#ifndef AVFILTER_DNN_DNN_BACKEND_NATIVE_LAYERS_H
+#define AVFILTER_DNN_DNN_BACKEND_NATIVE_LAYERS_H
+
+#include <stdint.h>
+#include "dnn_backend_native.h"
+
+typedef int (*LAYER_EXEC_FUNC)(DnnOperand *operands, const int32_t *input_operand_indexes,
+                               int32_t output_operand_index, const void *parameters);
+
+extern LAYER_EXEC_FUNC layer_funcs[DLT_COUNT];
+
+#endif
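
With the unified LAYER_EXEC_FUNC signature above, adding a layer type reduces to three steps: implement a function matching this signature, insert a DLT_* value before DLT_COUNT, and append the function to layer_funcs[] at the matching position. A hedged illustration follows; DemoReluParams and dnn_execute_layer_demo_relu are invented names and are not part of this commit.

#include <stdint.h>
#include "dnn_backend_native.h"

typedef struct DemoReluParams{
    float negative_slope;
} DemoReluParams;

/* matches LAYER_EXEC_FUNC, so it could be appended to layer_funcs[] */
int dnn_execute_layer_demo_relu(DnnOperand *operands, const int32_t *input_operand_indexes,
                                int32_t output_operand_index, const void *parameters)
{
    const DemoReluParams *params = parameters;   /* cast back from the unified void * */
    const DnnOperand *input = &operands[input_operand_indexes[0]];
    DnnOperand *output = &operands[output_operand_index];

    /* ... copy dims from input, allocate output->data, then write
       max(x, params->negative_slope * x) for every input element ... */
    (void)params; (void)input; (void)output;
    return 0;
}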
diff --git a/tests/dnn/dnn-layer-conv2d-test.c b/tests/dnn/dnn-layer-conv2d-test.c
index afc5391484588677f5b41d502f4b460da3f233cb..9d13da37c83ff75132340b693cb47e51dd5ee3a0 100644
@@ -113,7 +113,7 @@ static int test_with_same_dilate(void)
     operands[1].data = NULL;
 
     input_indexes[0] = 0;
-    convolve(operands, input_indexes, 1, &params);
+    dnn_execute_layer_conv2d(operands, input_indexes, 1, &params);
 
     output = operands[1].data;
     for (int i = 0; i < sizeof(expected_output) / sizeof(float); i++) {
@@ -212,7 +212,7 @@ static int test_with_valid(void)
     operands[1].data = NULL;
 
     input_indexes[0] = 0;
-    convolve(operands, input_indexes, 1, &params);
+    dnn_execute_layer_conv2d(operands, input_indexes, 1, &params);
 
     output = operands[1].data;
     for (int i = 0; i < sizeof(expected_output) / sizeof(float); i++) {
diff --git a/tests/dnn/dnn-layer-depth2space-test.c b/tests/dnn/dnn-layer-depth2space-test.c
index 87118de7958b9459f41c6e4d0e286a0678d40425..5225ec7b7ac153932465b8a2084affae479e1ede 100644
@@ -48,6 +48,7 @@ static int test(void)
     print(list(output.flatten()))
     */
 
+    DepthToSpaceParams params;
     DnnOperand operands[2];
     int32_t input_indexes[1];
     float input[1*5*3*4] = {
@@ -79,7 +80,8 @@ static int test(void)
     operands[1].data = NULL;
 
     input_indexes[0] = 0;
-    depth_to_space(operands, input_indexes, 1, 2);
+    params.block_size = 2;
+    dnn_execute_layer_depth2space(operands, input_indexes, 1, &params);
 
     output = operands[1].data;
     for (int i = 0; i < sizeof(expected_output) / sizeof(float); i++) {