[Backend] Add fp16 support for ONNXRuntime-GPU (#1239)

* add fp16 support for ort-gpu * add enable_ort_fp16 option * fix * fix bugs * use fp16 for test * update code * update code * fix windows bug
2025-10-15 21:20:53 +08:00 · 2023-03-23 18:23:13 +08:00
parent b62912ff9c
commit cae341e6c5
9 changed files with 67 additions and 24 deletions
--- a/fastdeploy/runtime/backends/ort/ort_backend.h
+++ b/fastdeploy/runtime/backends/ort/ort_backend.h
@@ -74,6 +74,10 @@ class OrtBackend : public BaseBackend {
  std::shared_ptr<Ort::IoBinding> binding_;
  std::vector<OrtValueInfo> inputs_desc_;
  std::vector<OrtValueInfo> outputs_desc_;
+
+  // File name of the ONNX model.
+  // It is set only when the ONNX model is larger than 2GB.
+  std::string model_file_name;
 #ifndef NON_64_PLATFORM
  Ort::CustomOpDomain custom_op_domain_ = Ort::CustomOpDomain("Paddle");
 #endif