[Serving][Backend] Backend supports zero_copy_infer and Serving reduces the output memory copy (#703)

* backend adds a zero-copy infer interface

* fix bug

* fix bug

* fix bug

* paddle ipu
This commit is contained in:
heliqi
2022-11-28 14:07:53 +08:00
committed by GitHub
parent edcf150d33
commit 42f1888bb0
21 changed files with 254 additions and 109 deletions

View File

@@ -187,7 +187,8 @@ TensorInfo LiteBackend::GetOutputInfo(int index) {
std::vector<TensorInfo> LiteBackend::GetOutputInfos() { return outputs_desc_; }
bool LiteBackend::Infer(std::vector<FDTensor>& inputs,
std::vector<FDTensor>* outputs) {
std::vector<FDTensor>* outputs,
bool copy_to_fd) {
if (inputs.size() != inputs_desc_.size()) {
FDERROR << "[LiteBackend] Size of inputs(" << inputs.size()
<< ") should keep same with the inputs of this model("