mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-15 21:20:53 +08:00
[Backend] Add fp16 support for ONNXRuntime-GPU (#1239)
* add fp16 support for ort-gpu
* add enable_ort_fp16 option
* fix
* fix bugs
* use fp16 for test
* update code
* update code
* fix windows bug
This commit is contained in:
4
fastdeploy/runtime/backends/ort/ort_backend.h
Normal file → Executable file
4
fastdeploy/runtime/backends/ort/ort_backend.h
Normal file → Executable file
@@ -74,6 +74,10 @@ class OrtBackend : public BaseBackend {
|
||||
std::shared_ptr<Ort::IoBinding> binding_;
|
||||
std::vector<OrtValueInfo> inputs_desc_;
|
||||
std::vector<OrtValueInfo> outputs_desc_;
|
||||
|
||||
// the ONNX model file name,
|
||||
// when the ONNX model is larger than 2 GB, we will set this name
|
||||
std::string model_file_name;
|
||||
#ifndef NON_64_PLATFORM
|
||||
Ort::CustomOpDomain custom_op_domain_ = Ort::CustomOpDomain("Paddle");
|
||||
#endif
|
||||
|
Reference in New Issue
Block a user