[Serving][Backend] Backend supports zero_copy_infer and Serving reduces output memory copies (#703)

* backend add zero copy infer interface * fix bug * fix bug * fix bug * paddle ipu
2025-10-06 09:07:10 +08:00 · 2022-11-28 14:07:53 +08:00
parent edcf150d33
commit 42f1888bb0
21 changed files with 254 additions and 109 deletions
--- a/fastdeploy/backends/lite/lite_backend.h
+++ b/fastdeploy/backends/lite/lite_backend.h
@@ -60,7 +60,9 @@ class LiteBackend : public BaseBackend {
                      const std::string& params_file,
                      const LiteBackendOption& option = LiteBackendOption());

-  bool Infer(std::vector<FDTensor>& inputs, std::vector<FDTensor>* outputs) override; // NOLINT
+  bool Infer(std::vector<FDTensor>& inputs,
+            std::vector<FDTensor>* outputs,
+            bool copy_to_fd = true) override; // NOLINT

  int NumInputs() const override { return inputs_desc_.size(); }