mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-06 00:57:33 +08:00
[Other] Optimize Poros backend (#1232)
* Optimize Poros backend * fix error * Add more pybind * fix conflicts * add some deprecate notices
This commit is contained in:
142
python/fastdeploy/runtime.py
Executable file → Normal file
142
python/fastdeploy/runtime.py
Executable file → Normal file
@@ -147,7 +147,7 @@ class Runtime:
|
||||
def get_profile_time(self):
|
||||
"""Get profile time of Runtime after the profile process is done.
|
||||
"""
|
||||
return self._runtime.get_profile_time()
|
||||
return self._runtime.get_profile_time()
|
||||
|
||||
|
||||
class RuntimeOption:
|
||||
@@ -160,65 +160,6 @@ class RuntimeOption:
|
||||
|
||||
self._option = C.RuntimeOption()
|
||||
|
||||
@property
|
||||
def is_dynamic(self):
|
||||
"""Only for Poros backend
|
||||
|
||||
:param value: (bool)Whether to enable dynamic shape, default False
|
||||
"""
|
||||
return self._option.is_dynamic
|
||||
|
||||
@property
|
||||
def unconst_ops_thres(self):
|
||||
"""Only for Poros backend
|
||||
|
||||
:param value: (int)Minimum number of subgraph OPs, default 10
|
||||
"""
|
||||
return self._option.unconst_ops_thres
|
||||
|
||||
@property
|
||||
def long_to_int(self):
|
||||
"""Only for Poros backend
|
||||
|
||||
:param value: (bool)Whether to convert long dtype to int dtype, default True
|
||||
"""
|
||||
return self._option.long_to_int
|
||||
|
||||
@property
|
||||
def use_nvidia_tf32(self):
|
||||
"""Only for Poros backend
|
||||
|
||||
:param value: (bool)The calculation accuracy of tf32 mode exists on the A card, which can bring some performance improvements, default False
|
||||
"""
|
||||
return self._option.use_nvidia_tf32
|
||||
|
||||
@is_dynamic.setter
def is_dynamic(self, value):
    """Set whether dynamic shape is enabled. Only for Poros backend.

    :param value: (bool)Whether to enable dynamic shape, default False
    :raises TypeError: if `value` is not a bool
    """
    # Raise explicitly instead of `assert`: asserts are stripped when
    # Python runs with -O, which would silently skip this validation.
    if not isinstance(value, bool):
        raise TypeError(
            "The value to set `is_dynamic` must be type of bool.")
    self._option.is_dynamic = value
|
||||
|
||||
@unconst_ops_thres.setter
def unconst_ops_thres(self, value):
    """Set the minimum number of subgraph OPs. Only for Poros backend.

    :param value: (int)Minimum number of subgraph OPs, default 10
    :raises TypeError: if `value` is not an int
    """
    # Raise explicitly instead of `assert`: asserts are stripped when
    # Python runs with -O, which would silently skip this validation.
    if not isinstance(value, int):
        raise TypeError(
            "The value to set `unconst_ops_thres` must be type of int.")
    self._option.unconst_ops_thres = value
|
||||
|
||||
@long_to_int.setter
def long_to_int(self, value):
    """Set whether to convert long dtype to int dtype. Only for Poros backend.

    :param value: (bool)Whether to convert long dtype to int dtype, default True
    :raises TypeError: if `value` is not a bool
    """
    # Raise explicitly instead of `assert`: asserts are stripped when
    # Python runs with -O, which would silently skip this validation.
    if not isinstance(value, bool):
        raise TypeError(
            "The value to set `long_to_int` must be type of bool.")
    self._option.long_to_int = value
|
||||
|
||||
@use_nvidia_tf32.setter
def use_nvidia_tf32(self, value):
    """Set whether to use tf32 mode. Only for Poros backend.

    :param value: (bool)Whether to enable tf32 mode, default False
    :raises TypeError: if `value` is not a bool
    """
    # Raise explicitly instead of `assert`: asserts are stripped when
    # Python runs with -O, which would silently skip this validation.
    if not isinstance(value, bool):
        raise TypeError(
            "The value to set `use_nvidia_tf32` must be type of bool.")
    self._option.use_nvidia_tf32 = value
|
||||
|
||||
def set_model_path(self,
|
||||
model_path,
|
||||
params_path="",
|
||||
@@ -322,6 +263,9 @@ class RuntimeOption:
|
||||
|
||||
:param level: (int)Optimization level, -1 means the default setting
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_ort_graph_opt_level` will be deprecated in v1.2.0, please use `RuntimeOption.graph_optimize_level = 99` instead."
|
||||
)
|
||||
return self._option.set_ort_graph_opt_level(level)
|
||||
|
||||
def use_paddle_backend(self):
|
||||
@@ -364,29 +308,36 @@ class RuntimeOption:
|
||||
"""
|
||||
return self.use_lite_backend()
|
||||
|
||||
def set_lite_device_names(self, device_names):
|
||||
"""Set nnadapter device name for Paddle Lite backend.
|
||||
"""
|
||||
return self._option.set_lite_device_names(device_names)
|
||||
|
||||
def set_lite_context_properties(self, context_properties):
|
||||
"""Set nnadapter context properties for Paddle Lite backend.
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_lite_context_properties` will be deprecated in v1.2.0, please use `RuntimeOption.paddle_lite_option.nnadapter_context_properties = ...` instead."
|
||||
)
|
||||
return self._option.set_lite_context_properties(context_properties)
|
||||
|
||||
def set_lite_model_cache_dir(self, model_cache_dir):
|
||||
"""Set nnadapter model cache dir for Paddle Lite backend.
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_lite_model_cache_dir` will be deprecated in v1.2.0, please use `RuntimeOption.paddle_lite_option.nnadapter_model_cache_dir = ...` instead."
|
||||
)
|
||||
return self._option.set_lite_model_cache_dir(model_cache_dir)
|
||||
|
||||
def set_lite_dynamic_shape_info(self, dynamic_shape_info):
|
||||
""" Set nnadapter dynamic shape info for Paddle Lite backend.
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_lite_dynamic_shape_info` will be deprecated in v1.2.0, please use `RuntimeOption.paddle_lite_option.nnadapter_dynamic_shape_info = ...` instead."
|
||||
)
|
||||
return self._option.set_lite_dynamic_shape_info(dynamic_shape_info)
|
||||
|
||||
def set_lite_subgraph_partition_path(self, subgraph_partition_path):
|
||||
""" Set nnadapter subgraph partition path for Paddle Lite backend.
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_lite_subgraph_partition_path` will be deprecated in v1.2.0, please use `RuntimeOption.paddle_lite_option.nnadapter_subgraph_partition_config_path = ...` instead."
|
||||
)
|
||||
return self._option.set_lite_subgraph_partition_path(
|
||||
subgraph_partition_path)
|
||||
|
||||
@@ -394,6 +345,9 @@ class RuntimeOption:
|
||||
subgraph_partition_buffer):
|
||||
""" Set nnadapter subgraph partition buffer for Paddle Lite backend.
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_lite_subgraph_partition_buffer` will be deprecated in v1.2.0, please use `RuntimeOption.paddle_lite_option.nnadapter_subgraph_partition_config_buffer = ...` instead."
|
||||
)
|
||||
return self._option.set_lite_subgraph_partition_config_buffer(
|
||||
subgraph_partition_buffer)
|
||||
|
||||
@@ -401,6 +355,9 @@ class RuntimeOption:
|
||||
self, mixed_precision_quantization_config_path):
|
||||
""" Set nnadapter mixed precision quantization config path for Paddle Lite backend..
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_lite_mixed_precision_quantization_config_path` will be deprecated in v1.2.0, please use `RuntimeOption.paddle_lite_option.nnadapter_mixed_precision_quantization_config_path = ...` instead."
|
||||
)
|
||||
return self._option.set_lite_mixed_precision_quantization_config_path(
|
||||
mixed_precision_quantization_config_path)
|
||||
|
||||
@@ -411,21 +368,33 @@ class RuntimeOption:
|
||||
|
||||
def set_openvino_device(self, name="CPU"):
|
||||
"""Set device name for OpenVINO, default 'CPU', can also be 'AUTO', 'GPU', 'GPU.1'....
|
||||
This interface is deprecated, please use `RuntimeOption.openvino_option.set_device` instead.
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_openvino_device` will be deprecated in v1.2.0, please use `RuntimeOption.openvino_option.set_device` instead."
|
||||
)
|
||||
return self._option.set_openvino_device(name)
|
||||
|
||||
def set_openvino_shape_info(self, shape_info):
|
||||
"""Set shape information of the models' inputs, used for GPU to fix the shape
|
||||
This interface is deprecated, please use `RuntimeOption.openvino_option.set_shape_info` instead.
|
||||
|
||||
:param shape_info: (dict{str, list of int})Shape information of model's inputs, e.g {"image": [1, 3, 640, 640], "scale_factor": [1, 2]}
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_openvino_shape_info` will be deprecated in v1.2.0, please use `RuntimeOption.openvino_option.set_shape_info` instead."
|
||||
)
|
||||
return self._option.set_openvino_shape_info(shape_info)
|
||||
|
||||
def set_openvino_cpu_operators(self, operators):
|
||||
"""While using OpenVINO backend and intel GPU, this interface specifies unsupported operators to run on CPU
|
||||
This interface is deprecated, please use `RuntimeOption.openvino_option.set_cpu_operators` instead.
|
||||
|
||||
:param operators: (list of string)list of operators' name, e.g ["MulticlasNms"]
|
||||
"""
|
||||
logging.warning(
|
||||
"`RuntimeOption.set_openvino_cpu_operators` will be deprecated in v1.2.0, please use `RuntimeOption.openvino_option.set_cpu_operators` instead."
|
||||
)
|
||||
return self._option.set_openvino_cpu_operators(operators)
|
||||
|
||||
def enable_paddle_log_info(self):
|
||||
@@ -557,15 +526,45 @@ class RuntimeOption:
|
||||
available_memory_proportion,
|
||||
enable_half_partial)
|
||||
|
||||
def enable_profiling(self,
|
||||
inclue_h2d_d2h=False,
|
||||
repeat=100, warmup=50):
|
||||
@property
|
||||
def poros_option(self):
|
||||
"""Get PorosBackendOption object to configure Poros backend
|
||||
|
||||
:return PorosBackendOption
|
||||
"""
|
||||
return self._option.poros_option
|
||||
|
||||
@property
|
||||
def paddle_lite_option(self):
|
||||
"""Get LiteBackendOption object to configure Paddle Lite backend
|
||||
|
||||
:return LiteBackendOption
|
||||
"""
|
||||
return self._option.paddle_lite_option
|
||||
|
||||
@property
|
||||
def openvino_option(self):
|
||||
"""Get OpenVINOOption object to configure OpenVINO backend
|
||||
|
||||
:return OpenVINOOption
|
||||
"""
|
||||
return self._option.openvino_option
|
||||
|
||||
@property
|
||||
def ort_option(self):
|
||||
"""Get OrtBackendOption object to configure ONNX Runtime backend
|
||||
|
||||
:return OrtBackendOption
|
||||
"""
|
||||
return self._option.ort_option
|
||||
|
||||
def enable_profiling(self, inclue_h2d_d2h=False, repeat=100, warmup=50):
|
||||
"""Set the profile mode as 'true'.
|
||||
:param inclue_h2d_d2h Whether to include time of H2D_D2H for time of runtime.
|
||||
:param repeat Repeat times for runtime inference.
|
||||
:param warmup Warmup times for runtime inference.
|
||||
"""
|
||||
return self._option.enable_profiling(inclue_h2d_d2h, repeat, warmup)
|
||||
"""
|
||||
return self._option.enable_profiling(inclue_h2d_d2h, repeat, warmup)
|
||||
|
||||
def disable_profiling(self):
|
||||
"""Set the profile mode as 'false'.
|
||||
@@ -580,8 +579,7 @@ class RuntimeOption:
|
||||
continue
|
||||
if hasattr(getattr(self._option, attr), "__call__"):
|
||||
continue
|
||||
message += " {} : {}\t\n".format(attr,
|
||||
getattr(self._option, attr))
|
||||
message += " {} : {}\t\n".format(attr, getattr(self._option, attr))
|
||||
message.strip("\n")
|
||||
message += ")"
|
||||
return message
|
||||
|
Reference in New Issue
Block a user