mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-06 00:57:33 +08:00

* first commit for yolov7 * pybind for yolov7 * CPP README.md * CPP README.md * modified yolov7.cc * README.md * python file modify * delete license in fastdeploy/ * repush the conflict part * README.md modified * README.md modified * file path modified * file path modified * file path modified * file path modified * file path modified * README modified * README modified * move some helpers to private * add examples for yolov7 * api.md modified * api.md modified * api.md modified * YOLOv7 * yolov7 release link * yolov7 release link * yolov7 release link * copyright * change some helpers to private * change variables to const and fix documents. * gitignore * Transfer some funtions to private member of class * Transfer some funtions to private member of class * Merge from develop (#9) * Fix compile problem in different python version (#26) * fix some usage problem in linux * Fix compile problem Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> * Add PaddleDetetion/PPYOLOE model support (#22) * add ppdet/ppyoloe * Add demo code and documents * add convert processor to vision (#27) * update .gitignore * Added checking for cmake include dir * fixed missing trt_backend option bug when init from trt * remove un-need data layout and add pre-check for dtype * changed RGB2BRG to BGR2RGB in ppcls model * add model_zoo yolov6 c++/python demo * fixed CMakeLists.txt typos * update yolov6 cpp/README.md * add yolox c++/pybind and model_zoo demo * move some helpers to private * fixed CMakeLists.txt typos * add normalize with alpha and beta * add version notes for yolov5/yolov6/yolox * add copyright to yolov5.cc * revert normalize * fixed some bugs in yolox * fixed examples/CMakeLists.txt to avoid conflicts * add convert processor to vision * format examples/CMakeLists summary * Fix bug while the inference result is empty with YOLOv5 (#29) * Add multi-label function for yolov5 * Update README.md Update doc * Update fastdeploy_runtime.cc fix variable 
option.trt_max_shape wrong name * Update runtime_option.md Update resnet model dynamic shape setting name from images to x * Fix bug when inference result boxes are empty * Delete detection.py Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> * first commit for yolor * for merge * Develop (#11) * Fix compile problem in different python version (#26) * fix some usage problem in linux * Fix compile problem Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> * Add PaddleDetetion/PPYOLOE model support (#22) * add ppdet/ppyoloe * Add demo code and documents * add convert processor to vision (#27) * update .gitignore * Added checking for cmake include dir * fixed missing trt_backend option bug when init from trt * remove un-need data layout and add pre-check for dtype * changed RGB2BRG to BGR2RGB in ppcls model * add model_zoo yolov6 c++/python demo * fixed CMakeLists.txt typos * update yolov6 cpp/README.md * add yolox c++/pybind and model_zoo demo * move some helpers to private * fixed CMakeLists.txt typos * add normalize with alpha and beta * add version notes for yolov5/yolov6/yolox * add copyright to yolov5.cc * revert normalize * fixed some bugs in yolox * fixed examples/CMakeLists.txt to avoid conflicts * add convert processor to vision * format examples/CMakeLists summary * Fix bug while the inference result is empty with YOLOv5 (#29) * Add multi-label function for yolov5 * Update README.md Update doc * Update fastdeploy_runtime.cc fix variable option.trt_max_shape wrong name * Update runtime_option.md Update resnet model dynamic shape setting name from images to x * Fix bug when inference result boxes are empty * Delete detection.py Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth 
<31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> * Yolor (#16) * Develop (#11) (#12) * Fix compile problem in different python version (#26) * fix some usage problem in linux * Fix compile problem Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> * Add PaddleDetetion/PPYOLOE model support (#22) * add ppdet/ppyoloe * Add demo code and documents * add convert processor to vision (#27) * update .gitignore * Added checking for cmake include dir * fixed missing trt_backend option bug when init from trt * remove un-need data layout and add pre-check for dtype * changed RGB2BRG to BGR2RGB in ppcls model * add model_zoo yolov6 c++/python demo * fixed CMakeLists.txt typos * update yolov6 cpp/README.md * add yolox c++/pybind and model_zoo demo * move some helpers to private * fixed CMakeLists.txt typos * add normalize with alpha and beta * add version notes for yolov5/yolov6/yolox * add copyright to yolov5.cc * revert normalize * fixed some bugs in yolox * fixed examples/CMakeLists.txt to avoid conflicts * add convert processor to vision * format examples/CMakeLists summary * Fix bug while the inference result is empty with YOLOv5 (#29) * Add multi-label function for yolov5 * Update README.md Update doc * Update fastdeploy_runtime.cc fix variable option.trt_max_shape wrong name * Update runtime_option.md Update resnet model dynamic shape setting name from images to x * Fix bug when inference result boxes are empty * Delete detection.py Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> * Develop (#13) * Fix compile 
problem in different python version (#26) * fix some usage problem in linux * Fix compile problem Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> * Add PaddleDetetion/PPYOLOE model support (#22) * add ppdet/ppyoloe * Add demo code and documents * add convert processor to vision (#27) * update .gitignore * Added checking for cmake include dir * fixed missing trt_backend option bug when init from trt * remove un-need data layout and add pre-check for dtype * changed RGB2BRG to BGR2RGB in ppcls model * add model_zoo yolov6 c++/python demo * fixed CMakeLists.txt typos * update yolov6 cpp/README.md * add yolox c++/pybind and model_zoo demo * move some helpers to private * fixed CMakeLists.txt typos * add normalize with alpha and beta * add version notes for yolov5/yolov6/yolox * add copyright to yolov5.cc * revert normalize * fixed some bugs in yolox * fixed examples/CMakeLists.txt to avoid conflicts * add convert processor to vision * format examples/CMakeLists summary * Fix bug while the inference result is empty with YOLOv5 (#29) * Add multi-label function for yolov5 * Update README.md Update doc * Update fastdeploy_runtime.cc fix variable option.trt_max_shape wrong name * Update runtime_option.md Update resnet model dynamic shape setting name from images to x * Fix bug when inference result boxes are empty * Delete detection.py Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> * documents * documents * documents * documents * documents * documents * documents * documents * documents * documents * documents * documents * Develop (#14) * Fix compile problem in different python version (#26) * fix some usage problem in linux * Fix compile problem Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> * Add PaddleDetetion/PPYOLOE model support (#22) * add 
ppdet/ppyoloe * Add demo code and documents * add convert processor to vision (#27) * update .gitignore * Added checking for cmake include dir * fixed missing trt_backend option bug when init from trt * remove un-need data layout and add pre-check for dtype * changed RGB2BRG to BGR2RGB in ppcls model * add model_zoo yolov6 c++/python demo * fixed CMakeLists.txt typos * update yolov6 cpp/README.md * add yolox c++/pybind and model_zoo demo * move some helpers to private * fixed CMakeLists.txt typos * add normalize with alpha and beta * add version notes for yolov5/yolov6/yolox * add copyright to yolov5.cc * revert normalize * fixed some bugs in yolox * fixed examples/CMakeLists.txt to avoid conflicts * add convert processor to vision * format examples/CMakeLists summary * Fix bug while the inference result is empty with YOLOv5 (#29) * Add multi-label function for yolov5 * Update README.md Update doc * Update fastdeploy_runtime.cc fix variable option.trt_max_shape wrong name * Update runtime_option.md Update resnet model dynamic shape setting name from images to x * Fix bug when inference result boxes are empty * Delete detection.py Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> Co-authored-by: Jason <928090362@qq.com> * add is_dynamic for YOLO series (#22) * modify ppmatting backend and docs * modify ppmatting docs * fix the PPMatting size problem * fix LimitShort's log * retrigger ci * modify PPMatting docs * modify the way for dealing with LimitShort * add python comments for external models * modify resnet c++ comments * modify C++ comments for external models * modify python comments and add result 
class comments * fix comments compile error * modify result.h comments * modify examples doc and code for SR models * code style * retrigger ci * python file code style * fix examples links * fix examples links * fix examples links Co-authored-by: Jason <jiangjiajun@baidu.com> Co-authored-by: root <root@bjyz-sys-gpu-kongming3.bjyz.baidu.com> Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> Co-authored-by: huangjianhui <852142024@qq.com> Co-authored-by: Jason <928090362@qq.com>
293 lines
9.5 KiB
C++
293 lines
9.5 KiB
C++
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#include "fastdeploy/vision.h"
|
|
|
|
// Path separator used to join the model directory with the model file names.
// `_WIN32` is the macro predefined by Windows compilers; `WIN32` is only set
// by some build systems/headers, so accept either one.
#if defined(_WIN32) || defined(WIN32)
const char sep = '\\';
#else
const char sep = '/';
#endif
|
|
|
|
void CpuInfer(const std::string& model_dir, const std::string& video_file,
|
|
int frame_num) {
|
|
auto model_file = model_dir + sep + "model.pdmodel";
|
|
auto params_file = model_dir + sep + "model.pdiparams";
|
|
auto model = fastdeploy::vision::sr::PPMSVSR(model_file, params_file);
|
|
|
|
if (!model.Initialized()) {
|
|
std::cerr << "Failed to initialize." << std::endl;
|
|
return;
|
|
}
|
|
// note: input/output shape is [b, n, c, h, w] (n = frame_nums; b=1(default))
|
|
// b and n is dependent on export model shape
|
|
// see
|
|
// https://github.com/PaddlePaddle/PaddleGAN/blob/develop/docs/zh_CN/tutorials/video_super_resolution.md
|
|
cv::VideoCapture capture;
|
|
// change your save video path
|
|
std::string video_out_name = "output.mp4";
|
|
capture.open(video_file);
|
|
if (!capture.isOpened()) {
|
|
std::cout << "can not open video " << std::endl;
|
|
return;
|
|
}
|
|
// Get Video info :fps, frame count
|
|
// it used 4.x version of opencv below
|
|
// notice your opencv version and method of api.
|
|
int video_fps = static_cast<int>(capture.get(cv::CAP_PROP_FPS));
|
|
int video_frame_count =
|
|
static_cast<int>(capture.get(cv::CAP_PROP_FRAME_COUNT));
|
|
// Set fixed size for output frame, only for msvsr model
|
|
int out_width = 1280;
|
|
int out_height = 720;
|
|
std::cout << "fps: " << video_fps << "\tframe_count: " << video_frame_count
|
|
<< std::endl;
|
|
|
|
// Create VideoWriter for output
|
|
cv::VideoWriter video_out;
|
|
std::string video_out_path("./");
|
|
video_out_path += video_out_name;
|
|
int fcc = cv::VideoWriter::fourcc('m', 'p', '4', 'v');
|
|
video_out.open(video_out_path, fcc, video_fps,
|
|
cv::Size(out_width, out_height), true);
|
|
if (!video_out.isOpened()) {
|
|
std::cout << "create video writer failed!" << std::endl;
|
|
return;
|
|
}
|
|
// Capture all frames and do inference
|
|
cv::Mat frame;
|
|
int frame_id = 0;
|
|
bool reach_end = false;
|
|
while (capture.isOpened()) {
|
|
std::vector<cv::Mat> imgs;
|
|
for (int i = 0; i < frame_num; i++) {
|
|
capture.read(frame);
|
|
if (!frame.empty()) {
|
|
imgs.push_back(frame);
|
|
} else {
|
|
reach_end = true;
|
|
}
|
|
}
|
|
if (reach_end) {
|
|
break;
|
|
}
|
|
std::vector<cv::Mat> results;
|
|
model.Predict(imgs, results);
|
|
for (auto& item : results) {
|
|
// cv::imshow("13",item);
|
|
// cv::waitKey(30);
|
|
video_out.write(item);
|
|
std::cout << "Processing frame: " << frame_id << std::endl;
|
|
frame_id += 1;
|
|
}
|
|
}
|
|
std::cout << "inference finished, output video saved at " << video_out_path
|
|
<< std::endl;
|
|
capture.release();
|
|
video_out.release();
|
|
}
|
|
|
|
void GpuInfer(const std::string& model_dir, const std::string& video_file,
|
|
int frame_num) {
|
|
auto model_file = model_dir + sep + "model.pdmodel";
|
|
auto params_file = model_dir + sep + "model.pdiparams";
|
|
|
|
auto option = fastdeploy::RuntimeOption();
|
|
// use paddle-TRT
|
|
option.UseGpu();
|
|
auto model = fastdeploy::vision::sr::PPMSVSR(model_file, params_file, option);
|
|
|
|
if (!model.Initialized()) {
|
|
std::cerr << "Failed to initialize." << std::endl;
|
|
return;
|
|
}
|
|
// note: input/output shape is [b, n, c, h, w] (n = frame_nums; b=1(default))
|
|
// b and n is dependent on export model shape
|
|
// see
|
|
// https://github.com/PaddlePaddle/PaddleGAN/blob/develop/docs/zh_CN/tutorials/video_super_resolution.md
|
|
cv::VideoCapture capture;
|
|
// change your save video path
|
|
std::string video_out_name = "output.mp4";
|
|
capture.open(video_file);
|
|
if (!capture.isOpened()) {
|
|
std::cout << "can not open video " << std::endl;
|
|
return;
|
|
}
|
|
// Get Video info :fps, frame count
|
|
int video_fps = static_cast<int>(capture.get(cv::CAP_PROP_FPS));
|
|
int video_frame_count =
|
|
static_cast<int>(capture.get(cv::CAP_PROP_FRAME_COUNT));
|
|
// Set fixed size for output frame, only for msvsr model
|
|
int out_width = 1280;
|
|
int out_height = 720;
|
|
std::cout << "fps: " << video_fps << "\tframe_count: " << video_frame_count
|
|
<< std::endl;
|
|
|
|
// Create VideoWriter for output
|
|
cv::VideoWriter video_out;
|
|
std::string video_out_path("./");
|
|
video_out_path += video_out_name;
|
|
int fcc = cv::VideoWriter::fourcc('m', 'p', '4', 'v');
|
|
video_out.open(video_out_path, fcc, video_fps,
|
|
cv::Size(out_width, out_height), true);
|
|
if (!video_out.isOpened()) {
|
|
std::cout << "create video writer failed!" << std::endl;
|
|
return;
|
|
}
|
|
// Capture all frames and do inference
|
|
cv::Mat frame;
|
|
int frame_id = 0;
|
|
bool reach_end = false;
|
|
while (capture.isOpened()) {
|
|
std::vector<cv::Mat> imgs;
|
|
for (int i = 0; i < frame_num; i++) {
|
|
capture.read(frame);
|
|
if (!frame.empty()) {
|
|
imgs.push_back(frame);
|
|
} else {
|
|
reach_end = true;
|
|
}
|
|
}
|
|
if (reach_end) {
|
|
break;
|
|
}
|
|
std::vector<cv::Mat> results;
|
|
model.Predict(imgs, results);
|
|
for (auto& item : results) {
|
|
// cv::imshow("13",item);
|
|
// cv::waitKey(30);
|
|
video_out.write(item);
|
|
std::cout << "Processing frame: " << frame_id << std::endl;
|
|
frame_id += 1;
|
|
}
|
|
}
|
|
std::cout << "inference finished, output video saved at " << video_out_path
|
|
<< std::endl;
|
|
capture.release();
|
|
video_out.release();
|
|
}
|
|
|
|
void TrtInfer(const std::string& model_dir, const std::string& video_file,
|
|
int frame_num) {
|
|
auto model_file = model_dir + sep + "model.pdmodel";
|
|
auto params_file = model_dir + sep + "model.pdiparams";
|
|
auto option = fastdeploy::RuntimeOption();
|
|
option.UseGpu();
|
|
option.UseTrtBackend();
|
|
option.EnablePaddleTrtCollectShape();
|
|
option.SetTrtInputShape("lqs", {1, 2, 3, 180, 320});
|
|
option.EnablePaddleToTrt();
|
|
auto model = fastdeploy::vision::sr::PPMSVSR(model_file, params_file, option);
|
|
|
|
if (!model.Initialized()) {
|
|
std::cerr << "Failed to initialize." << std::endl;
|
|
return;
|
|
}
|
|
|
|
// note: input/output shape is [b, n, c, h, w] (n = frame_nums; b=1(default))
|
|
// b and n is dependent on export model shape
|
|
// see
|
|
// https://github.com/PaddlePaddle/PaddleGAN/blob/develop/docs/zh_CN/tutorials/video_super_resolution.md
|
|
cv::VideoCapture capture;
|
|
// change your save video path
|
|
std::string video_out_name = "output.mp4";
|
|
capture.open(video_file);
|
|
if (!capture.isOpened()) {
|
|
std::cout << "can not open video " << std::endl;
|
|
return;
|
|
}
|
|
// Get Video info :fps, frame count
|
|
int video_fps = static_cast<int>(capture.get(cv::CAP_PROP_FPS));
|
|
int video_frame_count =
|
|
static_cast<int>(capture.get(cv::CAP_PROP_FRAME_COUNT));
|
|
// Set fixed size for output frame, only for msvsr model
|
|
// Note that the resolution between the size and the original input is
|
|
// consistent when the model is exported,
|
|
// for example: [1,2,3,180,320], after 4x super separation [1,2,3,720,1080].
|
|
// Therefore, it is very important to derive the model
|
|
int out_width = 1280;
|
|
int out_height = 720;
|
|
std::cout << "fps: " << video_fps << "\tframe_count: " << video_frame_count
|
|
<< std::endl;
|
|
|
|
// Create VideoWriter for output
|
|
cv::VideoWriter video_out;
|
|
std::string video_out_path("./");
|
|
video_out_path += video_out_name;
|
|
int fcc = cv::VideoWriter::fourcc('m', 'p', '4', 'v');
|
|
video_out.open(video_out_path, fcc, video_fps,
|
|
cv::Size(out_width, out_height), true);
|
|
if (!video_out.isOpened()) {
|
|
std::cout << "create video writer failed!" << std::endl;
|
|
return;
|
|
}
|
|
// Capture all frames and do inference
|
|
cv::Mat frame;
|
|
int frame_id = 0;
|
|
bool reach_end = false;
|
|
while (capture.isOpened()) {
|
|
std::vector<cv::Mat> imgs;
|
|
for (int i = 0; i < frame_num; i++) {
|
|
capture.read(frame);
|
|
if (!frame.empty()) {
|
|
imgs.push_back(frame);
|
|
} else {
|
|
reach_end = true;
|
|
}
|
|
}
|
|
if (reach_end) {
|
|
break;
|
|
}
|
|
std::vector<cv::Mat> results;
|
|
model.Predict(imgs, results);
|
|
for (auto& item : results) {
|
|
// cv::imshow("13",item);
|
|
// cv::waitKey(30);
|
|
video_out.write(item);
|
|
std::cout << "Processing frame: " << frame_id << std::endl;
|
|
frame_id += 1;
|
|
}
|
|
}
|
|
std::cout << "inference finished, output video saved at " << video_out_path
|
|
<< std::endl;
|
|
capture.release();
|
|
video_out.release();
|
|
}
|
|
|
|
int main(int argc, char* argv[]) {
|
|
if (argc < 4) {
|
|
std::cout << "Usage: infer_demo path/to/model_dir path/to/video frame "
|
|
"number run_option, "
|
|
"e.g ./infer_model ./vsr_model_dir ./vsr_src.mp4 0 2"
|
|
<< std::endl;
|
|
std::cout << "The data type of run_option is int, 0: run with cpu; 1: run "
|
|
"with gpu; 2: run with gpu and use tensorrt backend."
|
|
<< std::endl;
|
|
return -1;
|
|
}
|
|
|
|
int frame_num = 2;
|
|
if (argc == 5) {
|
|
frame_num = std::atoi(argv[4]);
|
|
}
|
|
if (std::atoi(argv[3]) == 0) {
|
|
CpuInfer(argv[1], argv[2], frame_num);
|
|
} else if (std::atoi(argv[3]) == 1) {
|
|
GpuInfer(argv[1], argv[2], frame_num);
|
|
} else if (std::atoi(argv[3]) == 2) {
|
|
TrtInfer(argv[1], argv[2], frame_num);
|
|
}
|
|
return 0;
|
|
}
|