Files
FastDeploy/fastdeploy/runtime/backends/openvino/option.h
Ethan Yang 4f48d84c27 [Backend] optimize cpu usage on openvino backend (#1531)
* optimiza cpu usage on openvino backend

conver the hint varible to string

* update with affinity mode set-up

---------

Co-authored-by: Ethan <yicheng@intel.com>
Co-authored-by: Jason <jiangjiajun@baidu.com>
2023-03-17 10:24:25 +08:00

102 lines
2.9 KiB
C++

// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once
#include "fastdeploy/core/fd_type.h"
#include <iostream>
#include <memory>
#include <string>
#include <vector>
#include <map>
#include <set>
namespace fastdeploy {
/*! @brief Option object to configure OpenVINO backend
*/
struct OpenVINOBackendOption {
std::string device = "CPU";
int cpu_thread_num = -1;
/// Number of streams while use OpenVINO
int num_streams = 1;
/// Affinity mode
std::string affinity = "YES";
/// Performance hint mode
std::string hint = "UNDEFINED";
/**
* @brief Set device name for OpenVINO, default 'CPU', can also be 'AUTO', 'GPU', 'GPU.1'....
*/
void SetDevice(const std::string& name = "CPU") {
device = name;
}
/**
* @brief Set shape info for OpenVINO
*/
void SetShapeInfo(
const std::map<std::string, std::vector<int64_t>>& _shape_infos) {
shape_infos = _shape_infos;
}
/**
* @brief While use OpenVINO backend with intel GPU, use this interface to specify operators run on CPU
*/
void SetCpuOperators(const std::vector<std::string>& operators) {
for (const auto& op : operators) {
cpu_operators.insert(op);
}
}
/**
* @brief Set Affinity mode
*/
void SetAffinity (const std::string& _affinity) {
FDASSERT(_affinity == "YES" || _affinity == "NO" || _affinity == "NUMA" ||
_affinity == "HYBRID_AWARE",
"The affinity mode should be one of the list "
"['YES', 'NO', 'NUMA', "
"'HYBRID_AWARE'] ");
affinity = _affinity;
}
/**
* @brief Set the Performance Hint
*/
void SetPerformanceHint (const std::string& _hint) {
FDASSERT(_hint == "LATENCY" || _hint == "THROUGHPUT" ||
_hint == "CUMULATIVE_THROUGHPUT" || _hint == "UNDEFINED",
"The performance hint should be one of the list "
"['LATENCY', 'THROUGHPUT', 'CUMULATIVE_THROUGHPUT', "
"'UNDEFINED'] ");
hint = _hint;
}
/**
* @brief Set the number of streams
*/
void SetStreamNum (int _num_streams) {
FDASSERT(_num_streams > 0, "The stream_num must be greater than 0.");
num_streams = _num_streams;
}
std::map<std::string, std::vector<int64_t>> shape_infos;
std::set<std::string> cpu_operators{"MulticlassNms"};
};
} // namespace fastdeploy