Files
FastDeploy/benchmark/cpp/flags.h
WJJ1995 11dd2512c5 [Benchmark] Add all backend config (#1587)
* add GPL license

* add GPL-3.0 license

* add GPL-3.0 license

* add GPL-3.0 license

* support yolov8

* add pybind for yolov8

* add yolov8 readme

* add cpp benchmark

* add cpu and gpu mem

* public part split

* add runtime mode

* fixed bugs

* add cpu_thread_nums

* deal with comments

* deal with comments

* deal with comments

* rm useless code

* add FASTDEPLOY_DECL

* add FASTDEPLOY_DECL

* fixed for windows

* mv rss to pss

* mv rss to pss

* Update utils.cc

* use thread to collect mem

* Add ResourceUsageMonitor

* rm useless code

* fixed bug

* fixed typo

* update ResourceUsageMonitor

* fixed bug

* fixed bug

* add note for ResourceUsageMonitor

* deal with comments

* add macros

* deal with comments

* deal with comments

* deal with comments

* re-lint

* rm pmap and use mem api

* rm pmap and use mem api

* add mem api

* Add PrintBenchmarkInfo func

* Add PrintBenchmarkInfo func

* Add PrintBenchmarkInfo func

* deal with comments

* fixed enable_paddle_to_trt

* add log for paddle_trt

* support ppcls benchmark

* use new trt option api

* update benchmark info

* simplify benchmark.cc

* simplify benchmark.cc

* deal with comments

* Add ppseg && ppocr benchmark

* add OCR rec img

* add ocr benchmark

* fixed trt shape

* add trt shape

* resolve conflict

* add ENABLE_BENCHMARK define

* Add ClassifyDiff

* Add Resize for ClassifyResult

* deal with comments

* add convert info script

* resolve conflict

* Add SaveBenchmarkResult func

* fixed bug

* fixed bug

* fixed bug

* add config.txt for option

* fixed bug

* fixed bug

* fixed bug

* add benchmark.sh

* mv thread_nums from 8 to 1

* deal with comments

* deal with comments

* fixed readme

* deal with comments

* add all platform shell

* Update config.arm.txt

* Update config.gpu.txt

* Update config.x86.txt

* fixed printinfo bug

* rm proxy

* add more model support

* all backend config.txt

* deal with comments

---------

Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com>
2023-03-13 15:36:30 +08:00

94 lines
3.5 KiB
C++
Executable File

// Copyright (c) 2023 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once
#include <unordered_map>
#include "gflags/gflags.h"
#include "fastdeploy/benchmark/utils.h"
// Path separator of the host platform. PrintBenchmarkInfo passes it to
// fastdeploy::benchmark::Split when breaking FLAGS_model into components.
//
// _WIN32 is the macro the compiler itself predefines for Windows targets;
// WIN32 only exists when an SDK header or a build flag supplies it, so both
// are checked to avoid silently selecting '/' on Windows.
#if defined(_WIN32) || defined(WIN32)
static const char sep = '\\';
#else
static const char sep = '/';
#endif
// Command-line flags of the benchmark programs, declared through gflags.
// Each DEFINE_* below is read in code as FLAGS_<name>.

// Model directory. PrintBenchmarkInfo splits this path on `sep` and reports
// the last component as the model name.
DEFINE_string(model, "", "Directory of the inference model.");
// Input image path (not read anywhere in this header).
DEFINE_string(image, "", "Path of the image file.");
// Benchmark config file; defaults to "config.txt" (not read anywhere in this
// header).
DEFINE_string(config_path, "config.txt", "Path of benchmark config.");
// -1 is the "not set" sentinel: PrintBenchmarkInfo only lets this flag
// override the config's "warmup" entry when it differs from -1.
DEFINE_int32(warmup, -1, "Number of warmup for profiling.");
// -1 is the "not set" sentinel: PrintBenchmarkInfo only lets this flag
// override the config's "repeat" entry when it differs from -1.
DEFINE_int32(repeat, -1, "Number of repeats for profiling.");
// Writes the command-line usage banner, followed by the documented default
// values for device, backend and use_fp16, to standard output.
// Each line is terminated with std::endl, so the stream is flushed per line.
static void PrintUsage() {
  static const char* const kUsageLines[] = {
      "Usage: infer_demo --model model_path --image img_path "
      "--config_path config.txt[Path of benchmark config.] ",
      "Default value of device: cpu",
      "Default value of backend: default",
      "Default value of use_fp16: false",
  };
  for (const char* usage_line : kUsageLines) {
    std::cout << usage_line << std::endl;
  }
}
// Picks the effective value of an iteration-count setting.
// Returns `flag_value` when it was given on the command line (anything other
// than the -1 "not set" sentinel). Otherwise parses `config_value` with
// std::stoi, which throws std::invalid_argument / std::out_of_range when the
// text is empty, non-numeric or too large. The config text is deliberately
// not parsed when the flag already supplies the value.
static inline int ResolveBenchmarkCount(int flag_value,
                                        const std::string& config_value) {
  return flag_value != -1 ? flag_value : std::stoi(config_value);
}

// Prints a human-readable summary of the benchmark setup and forwards the
// same text to ResultManager::SaveBenchmarkResult.
//
// config_info: key/value settings of the benchmark. It is taken by value, so
//   lookups with operator[] on keys that are absent yield "" without touching
//   the caller's map. Keys read here: "warmup", "repeat", "profile_mode",
//   "include_h2d_d2h", "device", "device_id", "use_fp16", "backend",
//   "cpu_thread_nums", "collect_memory_info", "sampling_interval" and
//   "result_path".
//
// FLAGS_warmup / FLAGS_repeat take precedence over the "warmup" / "repeat"
// config entries whenever they are not -1; in that case the config entry is
// not parsed at all, so a missing or malformed entry no longer aborts a run
// whose value was given on the command line. If a flag is left at -1 and the
// matching entry is not a valid integer, std::stoi throws.
//
// The whole body is compiled only when both ENABLE_BENCHMARK and
// ENABLE_VISION are defined; otherwise the function does nothing.
static void PrintBenchmarkInfo(std::unordered_map<std::string,
                               std::string> config_info) {
#if defined(ENABLE_BENCHMARK) && defined(ENABLE_VISION)
  // The last component of the model path is reported as the model name.
  std::vector<std::string> model_names;
  fastdeploy::benchmark::Split(FLAGS_model, model_names, sep);
  if (model_names.empty()) {
    std::cout << "Directory of the inference model is invalid!!!" << std::endl;
    return;
  }

  // Command-line values win over the config file.
  const int warmup = ResolveBenchmarkCount(FLAGS_warmup, config_info["warmup"]);
  const int repeat = ResolveBenchmarkCount(FLAGS_repeat, config_info["repeat"]);

  // Assemble the report once; it is both printed and saved below.
  std::stringstream ss;
  ss << "\n======= Model Info =======\n";
  ss << "model_name: " << model_names.back() << '\n';
  ss << "profile_mode: " << config_info["profile_mode"] << '\n';
  if (config_info["profile_mode"] == "runtime") {
    ss << "include_h2d_d2h: " << config_info["include_h2d_d2h"] << '\n';
  }

  ss << "\n======= Backend Info =======\n";
  ss << "warmup: " << warmup << '\n';
  ss << "repeats: " << repeat << '\n';
  ss << "device: " << config_info["device"] << '\n';
  if (config_info["device"] == "gpu") {
    ss << "device_id: " << config_info["device_id"] << '\n';
  }
  ss << "use_fp16: " << config_info["use_fp16"] << '\n';
  ss << "backend: " << config_info["backend"] << '\n';
  if (config_info["device"] == "cpu") {
    ss << "cpu_thread_nums: " << config_info["cpu_thread_nums"] << '\n';
  }
  ss << "collect_memory_info: " << config_info["collect_memory_info"] << '\n';
  if (config_info["collect_memory_info"] == "true") {
    ss << "sampling_interval: " << config_info["sampling_interval"]
       << "ms" << '\n';
  }

  const std::string report = ss.str();
  std::cout << report << std::endl;
  // Hand the report to the result manager together with the configured
  // "result_path" (presumably the file it is written to -- confirm in
  // ResultManager).
  fastdeploy::benchmark::ResultManager::SaveBenchmarkResult(
      report, config_info["result_path"]);
#endif
}