From d19510fe770e5cb22982439b2c7dd65af65b48b0 Mon Sep 17 00:00:00 2001
From: yunyaoXYY <109218879+yunyaoXYY@users.noreply.github.com>
Date: Thu, 8 Dec 2022 23:32:14 +0800
Subject: [PATCH 01/77] [Other] Update PP-OCRv2/v3 example. (#838)

* Fix links in readme

* Fix links in readme

* Update PPOCRv2/v3 examples
---
 examples/vision/ocr/PP-OCRv2/cpp/infer.cc    | 17 +++++++++++++---
 examples/vision/ocr/PP-OCRv2/python/infer.py | 21 ++++++++++++++++----
 examples/vision/ocr/PP-OCRv3/cpp/infer.cc    | 18 ++++++++++++++---
 examples/vision/ocr/PP-OCRv3/python/infer.py | 21 ++++++++++++++++----
 4 files changed, 63 insertions(+), 14 deletions(-)

diff --git a/examples/vision/ocr/PP-OCRv2/cpp/infer.cc b/examples/vision/ocr/PP-OCRv2/cpp/infer.cc
index 7bac320d5..6cde6390f 100644
--- a/examples/vision/ocr/PP-OCRv2/cpp/infer.cc
+++ b/examples/vision/ocr/PP-OCRv2/cpp/infer.cc
@@ -33,13 +33,18 @@ void InitAndInfer(const std::string& det_model_dir, const std::string& cls_model
   auto cls_option = option;
   auto rec_option = option;

+  // The cls and rec models can now run inference on a batch of images.
+  // Users can initialize the inference batch sizes here and apply them after the PPOCR model is created.
+  int cls_batch_size = 1;
+  int rec_batch_size = 6;
+
   // If use TRT backend, the dynamic shape will be set as follow.
   // We recommend that users set the length and height of the detection model to a multiple of 32.
   det_option.SetTrtInputShape("x", {1, 3, 64,64}, {1, 3, 640, 640},
                               {1, 3, 960, 960});
-  cls_option.SetTrtInputShape("x", {1, 3, 48, 10}, {10, 3, 48, 320}, {32, 3, 48, 1024});
-  rec_option.SetTrtInputShape("x", {1, 3, 32, 10}, {10, 3, 32, 320},
-                              {32, 3, 32, 2304});
+  cls_option.SetTrtInputShape("x", {1, 3, 48, 10}, {cls_batch_size, 3, 48, 320}, {cls_batch_size, 3, 48, 1024});
+  rec_option.SetTrtInputShape("x", {1, 3, 32, 10}, {rec_batch_size, 3, 32, 320},
+                              {rec_batch_size, 3, 32, 2304});

   // Users could save TRT cache file to disk as follow.
   // det_option.SetTrtCacheFile(det_model_dir + sep + "det_trt_cache.trt");
@@ -58,6 +63,12 @@ void InitAndInfer(const std::string& det_model_dir, const std::string& cls_model
   // auto ppocr_v2 = fastdeploy::pipeline::PPOCRv2(&det_model, &rec_model);
   auto ppocr_v2 = fastdeploy::pipeline::PPOCRv2(&det_model, &cls_model, &rec_model);

+  // Set the inference batch size for the cls and rec models; the value can be -1 or any positive integer.
+  // When the inference batch size is set to -1, the inference batch size
+  // of the cls and rec models will be the same as the number of boxes detected by the det model.
+  ppocr_v2.SetClsBatchSize(cls_batch_size);
+  ppocr_v2.SetRecBatchSize(rec_batch_size);
+
   if(!ppocr_v2.Initialized()){
     std::cerr << "Failed to initialize PP-OCR." << std::endl;
     return;

diff --git a/examples/vision/ocr/PP-OCRv2/python/infer.py b/examples/vision/ocr/PP-OCRv2/python/infer.py
index af915143a..1487d795f 100644
--- a/examples/vision/ocr/PP-OCRv2/python/infer.py
+++ b/examples/vision/ocr/PP-OCRv2/python/infer.py
@@ -106,6 +106,11 @@ rec_label_file = args.rec_label_file
 # 用户也可根据自行需求分别配置
 runtime_option = build_option(args)

+# PPOCR的cls和rec模型现在已经支持推理一个Batch的数据
+# 定义下面два变量后, 可用于设置trt输入shape, 并在PPOCR模型初始化后, 完成Batch推理设置
+cls_batch_size = 1
+rec_batch_size = 6
+
 # 当使用TRT时,分别给三个模型的runtime设置动态shape,并完成模型的创建.
 # 注意: 需要在检测模型创建完成后,再设置分类模型的动态输入并创建分类模型, 识别模型同理.
 # 如果用户想要自己改动检测模型的输入shape, 我们建议用户把检测模型的长和高设置为32的倍数.
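The batch-size variables introduced above exist to feed the TRT dynamic-shape setup: `SetTrtInputShape` registers a minimum, an optimum, and a maximum shape for a named input, and the resulting engine accepts any batch size between the min and the max. A minimal standalone sketch of that pattern, using the rec model's values from this patch (the `UseGpu`/`UseTrtBackend` calls are standard FastDeploy runtime options assumed for context, not part of this diff):

```cpp
#include "fastdeploy/runtime.h"

int main() {
  int rec_batch_size = 6;  // same value this patch picks for the rec model
  fastdeploy::RuntimeOption rec_option;
  rec_option.UseGpu(0);        // TensorRT needs a GPU device
  rec_option.UseTrtBackend();
  // Arguments: input name, min shape, opt shape, max shape. The built engine
  // accepts any batch size from 1 (min) up to rec_batch_size (max); the opt
  // shape is the one TensorRT tunes its kernels for.
  rec_option.SetTrtInputShape("x", {1, 3, 32, 10},
                              {rec_batch_size, 3, 32, 320},
                              {rec_batch_size, 3, 32, 2304});
  return 0;
}
```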
@@ -118,16 +123,18 @@ det_model = fd.vision.ocr.DBDetector(
     det_model_file, det_params_file, runtime_option=det_option)

 cls_option = runtime_option
-cls_option.set_trt_input_shape("x", [1, 3, 48, 10], [10, 3, 48, 320],
-                               [32, 3, 48, 1024])
+cls_option.set_trt_input_shape("x", [1, 3, 48, 10],
+                               [cls_batch_size, 3, 48, 320],
+                               [cls_batch_size, 3, 48, 1024])
 # 用户可以把TRT引擎文件保存至本地
 # cls_option.set_trt_cache_file(args.cls_model + "/cls_trt_cache.trt")
 cls_model = fd.vision.ocr.Classifier(
     cls_model_file, cls_params_file, runtime_option=cls_option)

 rec_option = runtime_option
-rec_option.set_trt_input_shape("x", [1, 3, 32, 10], [10, 3, 32, 320],
-                               [32, 3, 32, 2304])
+rec_option.set_trt_input_shape("x", [1, 3, 32, 10],
+                               [rec_batch_size, 3, 32, 320],
+                               [rec_batch_size, 3, 32, 2304])
 # 用户可以把TRT引擎文件保存至本地
 # rec_option.set_trt_cache_file(args.rec_model + "/rec_trt_cache.trt")
 rec_model = fd.vision.ocr.Recognizer(
@@ -137,6 +144,12 @@ rec_model = fd.vision.ocr.Recognizer(
 ppocr_v2 = fd.vision.ocr.PPOCRv2(
     det_model=det_model, cls_model=cls_model, rec_model=rec_model)

+# 给cls和rec模型设置推理时的batch size
+# 此值能为-1, 和1到正无穷
+# 当此值为-1时, cls和rec模型的batch size将默认和det模型检测出的框的数量相同
+ppocr_v2.cls_batch_size = cls_batch_size
+ppocr_v2.rec_batch_size = rec_batch_size
+
 # 预测图片准备
 im = cv2.imread(args.image)

diff --git a/examples/vision/ocr/PP-OCRv3/cpp/infer.cc b/examples/vision/ocr/PP-OCRv3/cpp/infer.cc
index 911b311e3..90b77679f 100644
--- a/examples/vision/ocr/PP-OCRv3/cpp/infer.cc
+++ b/examples/vision/ocr/PP-OCRv3/cpp/infer.cc
@@ -33,13 +33,19 @@ void InitAndInfer(const std::string& det_model_dir, const std::string& cls_model
   auto cls_option = option;
   auto rec_option = option;

+  // The cls and rec models can now run inference on a batch of images.
+  // Users can initialize the inference batch sizes here and apply them after the PPOCR model is created.
+  int cls_batch_size = 1;
+  int rec_batch_size = 6;
+
   // If use TRT backend, the dynamic shape will be set as follow.
   // We recommend that users set the length and height of the detection model to a multiple of 32.
+  // We also recommend that users set the TRT input shapes as follows.
   det_option.SetTrtInputShape("x", {1, 3, 64,64}, {1, 3, 640, 640},
                               {1, 3, 960, 960});
-  cls_option.SetTrtInputShape("x", {1, 3, 48, 10}, {10, 3, 48, 320}, {64, 3, 48, 1024});
-  rec_option.SetTrtInputShape("x", {1, 3, 48, 10}, {10, 3, 48, 320},
-                              {64, 3, 48, 2304});
+  cls_option.SetTrtInputShape("x", {1, 3, 48, 10}, {cls_batch_size, 3, 48, 320}, {cls_batch_size, 3, 48, 1024});
+  rec_option.SetTrtInputShape("x", {1, 3, 48, 10}, {rec_batch_size, 3, 48, 320},
+                              {rec_batch_size, 3, 48, 2304});

   // Users could save TRT cache file to disk as follow.
   // det_option.SetTrtCacheFile(det_model_dir + sep + "det_trt_cache.trt");
@@ -57,6 +63,12 @@ void InitAndInfer(const std::string& det_model_dir, const std::string& cls_model
   // The classification model is optional, so the PP-OCR can also be connected in series as follows
   // auto ppocr_v3 = fastdeploy::pipeline::PPOCRv3(&det_model, &rec_model);
   auto ppocr_v3 = fastdeploy::pipeline::PPOCRv3(&det_model, &cls_model, &rec_model);
+
+  // Set the inference batch size for the cls and rec models; the value can be -1 or any positive integer.
+  // When the inference batch size is set to -1, the inference batch size
+  // of the cls and rec models will be the same as the number of boxes detected by the det model.
+  ppocr_v3.SetClsBatchSize(cls_batch_size);
+  ppocr_v3.SetRecBatchSize(rec_batch_size);

   if(!ppocr_v3.Initialized()){
     std::cerr << "Failed to initialize PP-OCR."
<< std::endl; diff --git a/examples/vision/ocr/PP-OCRv3/python/infer.py b/examples/vision/ocr/PP-OCRv3/python/infer.py index b6b27b240..1ec962cb5 100644 --- a/examples/vision/ocr/PP-OCRv3/python/infer.py +++ b/examples/vision/ocr/PP-OCRv3/python/infer.py @@ -106,6 +106,11 @@ rec_label_file = args.rec_label_file # 用户也可根据自行需求分别配置 runtime_option = build_option(args) +# PPOCR的cls和rec模型现在已经支持推理一个Batch的数据 +# 定义下面两个变量后, 可用于设置trt输入shape, 并在PPOCR模型初始化后, 完成Batch推理设置 +cls_batch_size = 1 +rec_batch_size = 6 + # 当使用TRT时,分别给三个模型的runtime设置动态shape,并完成模型的创建. # 注意: 需要在检测模型创建完成后,再设置分类模型的动态输入并创建分类模型, 识别模型同理. # 如果用户想要自己改动检测模型的输入shape, 我们建议用户把检测模型的长和高设置为32的倍数. @@ -118,16 +123,18 @@ det_model = fd.vision.ocr.DBDetector( det_model_file, det_params_file, runtime_option=det_option) cls_option = runtime_option -cls_option.set_trt_input_shape("x", [1, 3, 48, 10], [10, 3, 48, 320], - [64, 3, 48, 1024]) +cls_option.set_trt_input_shape("x", [1, 3, 48, 10], + [cls_batch_size, 3, 48, 320], + [cls_batch_size, 3, 48, 1024]) # 用户可以把TRT引擎文件保存至本地 # cls_option.set_trt_cache_file(args.cls_model + "/cls_trt_cache.trt") cls_model = fd.vision.ocr.Classifier( cls_model_file, cls_params_file, runtime_option=cls_option) rec_option = runtime_option -rec_option.set_trt_input_shape("x", [1, 3, 48, 10], [10, 3, 48, 320], - [64, 3, 48, 2304]) +rec_option.set_trt_input_shape("x", [1, 3, 48, 10], + [rec_batch_size, 3, 48, 320], + [rec_batch_size, 3, 48, 2304]) # 用户可以把TRT引擎文件保存至本地 # rec_option.set_trt_cache_file(args.rec_model + "/rec_trt_cache.trt") rec_model = fd.vision.ocr.Recognizer( @@ -137,6 +144,12 @@ rec_model = fd.vision.ocr.Recognizer( ppocr_v3 = fd.vision.ocr.PPOCRv3( det_model=det_model, cls_model=cls_model, rec_model=rec_model) +# 给cls和rec模型设置推理时的batch size +# 此值能为-1, 和1到正无穷 +# 当此值为-1时, cls和rec模型的batch size将默认和det模型检测出的框的数量相同 +ppocr_v3.cls_batch_size = cls_batch_size +ppocr_v3.rec_batch_size = rec_batch_size + # 预测图片准备 im = cv2.imread(args.image) From 22325d23ed1543b7034f3214d7f8be3ff6a1c8db Mon Sep 17 00:00:00 2001 From: MistEO Date: Fri, 9 Dec 2022 09:20:55 +0800 Subject: [PATCH 02/77] [Other] Add const modifier to some OCR interface parameters (#836) * [Other] Add const modifier to some OCR interface parameters * [Other] Add a Predict interface to PPOCR with const parameters For interface compatibility, I chose to add rather than modify --- examples/vision/ocr/PP-OCRv2/cpp/README.md | 1 + fastdeploy/vision/ocr/ppocr/classifier.cc | 2 +- fastdeploy/vision/ocr/ppocr/classifier.h | 2 +- fastdeploy/vision/ocr/ppocr/ppocr_v2.cc | 8 ++++++-- fastdeploy/vision/ocr/ppocr/ppocr_v2.h | 1 + fastdeploy/vision/ocr/ppocr/recognizer.cc | 2 +- fastdeploy/vision/ocr/ppocr/recognizer.h | 2 +- 7 files changed, 12 insertions(+), 6 deletions(-) diff --git a/examples/vision/ocr/PP-OCRv2/cpp/README.md b/examples/vision/ocr/PP-OCRv2/cpp/README.md index 965ece716..1bb794f5e 100644 --- a/examples/vision/ocr/PP-OCRv2/cpp/README.md +++ b/examples/vision/ocr/PP-OCRv2/cpp/README.md @@ -82,6 +82,7 @@ PPOCRv2 的初始化,由检测,识别模型串联构成(无分类器) > ``` > bool Predict(cv::Mat* img, fastdeploy::vision::OCRResult* result); +> bool Predict(const cv::Mat& img, fastdeploy::vision::OCRResult* result); > ``` > > 模型预测接口,输入一张图片,返回OCR预测结果 diff --git a/fastdeploy/vision/ocr/ppocr/classifier.cc b/fastdeploy/vision/ocr/ppocr/classifier.cc index 4be9a3556..216d50fd2 100755 --- a/fastdeploy/vision/ocr/ppocr/classifier.cc +++ b/fastdeploy/vision/ocr/ppocr/classifier.cc @@ -50,7 +50,7 @@ bool Classifier::Initialize() { return true; } -bool Classifier::Predict(cv::Mat& img, int32_t* 
cls_label, float* cls_score) {
+bool Classifier::Predict(const cv::Mat& img, int32_t* cls_label, float* cls_score) {
   std::vector<int32_t> cls_labels(1);
   std::vector<float> cls_scores(1);
   bool success = BatchPredict({img}, &cls_labels, &cls_scores);

diff --git a/fastdeploy/vision/ocr/ppocr/classifier.h b/fastdeploy/vision/ocr/ppocr/classifier.h
index ddc4db27a..5a4ed02a0 100755
--- a/fastdeploy/vision/ocr/ppocr/classifier.h
+++ b/fastdeploy/vision/ocr/ppocr/classifier.h
@@ -43,7 +43,7 @@ class FASTDEPLOY_DECL Classifier : public FastDeployModel {
                   const ModelFormat& model_format = ModelFormat::PADDLE);
   /// Get model's name
   std::string ModelName() const { return "ppocr/ocr_cls"; }
-  virtual bool Predict(cv::Mat& img, int32_t* cls_label, float* cls_score);
+  virtual bool Predict(const cv::Mat& img, int32_t* cls_label, float* cls_score);
   /** \brief BatchPredict the input image and get OCR classification model cls_result.
    *
    * \param[in] images The list of input image data, comes from cv::imread(), is a 3-D array with layout HWC, BGR format.

diff --git a/fastdeploy/vision/ocr/ppocr/ppocr_v2.cc b/fastdeploy/vision/ocr/ppocr/ppocr_v2.cc
index 2ee2f903f..756604dde 100755
--- a/fastdeploy/vision/ocr/ppocr/ppocr_v2.cc
+++ b/fastdeploy/vision/ocr/ppocr/ppocr_v2.cc
@@ -74,11 +74,15 @@ bool PPOCRv2::Initialized() const {
   }
   return true;
 }
-
 bool PPOCRv2::Predict(cv::Mat* img, fastdeploy::vision::OCRResult* result) {
+  return Predict(*img, result);
+}
+
+bool PPOCRv2::Predict(const cv::Mat& img,
+                      fastdeploy::vision::OCRResult* result) {
   std::vector<fastdeploy::vision::OCRResult> batch_result(1);
-  bool success = BatchPredict({*img},&batch_result);
+  bool success = BatchPredict({img},&batch_result);
   if(!success){
     return success;
   }

diff --git a/fastdeploy/vision/ocr/ppocr/ppocr_v2.h b/fastdeploy/vision/ocr/ppocr/ppocr_v2.h
index 05f2b9309..f603a45f9 100755
--- a/fastdeploy/vision/ocr/ppocr/ppocr_v2.h
+++ b/fastdeploy/vision/ocr/ppocr/ppocr_v2.h
@@ -59,6 +59,7 @@ class FASTDEPLOY_DECL PPOCRv2 : public FastDeployModel {
    * \return true if the prediction succeeded, otherwise false.
    */
   virtual bool Predict(cv::Mat* img, fastdeploy::vision::OCRResult* result);
+  virtual bool Predict(const cv::Mat& img, fastdeploy::vision::OCRResult* result);
   /** \brief BatchPredict the input image and get OCR result.
    *
    * \param[in] images The list of input image data, comes from cv::imread(), is a 3-D array with layout HWC, BGR format.
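Taken together, the changes in this patch let callers run the pipeline on a `const cv::Mat&` instead of a mutable pointer. A minimal sketch of calling the new overload (pipeline construction is elided and assumed to follow the PP-OCRv2 example from patch 01; `OCRResult::Str()` is FastDeploy's existing result formatter):

```cpp
#include <iostream>
#include <opencv2/opencv.hpp>
#include "fastdeploy/vision.h"

// Assumes ppocr_v2 was assembled from det/cls/rec models as in patch 01.
void PredictOnce(fastdeploy::pipeline::PPOCRv2& ppocr_v2,
                 const std::string& image_path) {
  const cv::Mat img = cv::imread(image_path);  // the input can now stay const
  fastdeploy::vision::OCRResult result;
  if (!ppocr_v2.Predict(img, &result)) {  // the new const cv::Mat& overload
    std::cerr << "Failed to predict." << std::endl;
    return;
  }
  std::cout << result.Str() << std::endl;
}
```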
diff --git a/fastdeploy/vision/ocr/ppocr/recognizer.cc b/fastdeploy/vision/ocr/ppocr/recognizer.cc index a20f312c2..8965e73d9 100755 --- a/fastdeploy/vision/ocr/ppocr/recognizer.cc +++ b/fastdeploy/vision/ocr/ppocr/recognizer.cc @@ -53,7 +53,7 @@ bool Recognizer::Initialize() { return true; } -bool Recognizer::Predict(cv::Mat& img, std::string* text, float* rec_score) { +bool Recognizer::Predict(const cv::Mat& img, std::string* text, float* rec_score) { std::vector texts(1); std::vector rec_scores(1); bool success = BatchPredict({img}, &texts, &rec_scores); diff --git a/fastdeploy/vision/ocr/ppocr/recognizer.h b/fastdeploy/vision/ocr/ppocr/recognizer.h index 4ee12bb6a..8a5f5bc70 100755 --- a/fastdeploy/vision/ocr/ppocr/recognizer.h +++ b/fastdeploy/vision/ocr/ppocr/recognizer.h @@ -45,7 +45,7 @@ class FASTDEPLOY_DECL Recognizer : public FastDeployModel { const ModelFormat& model_format = ModelFormat::PADDLE); /// Get model's name std::string ModelName() const { return "ppocr/ocr_rec"; } - virtual bool Predict(cv::Mat& img, std::string* text, float* rec_score); + virtual bool Predict(const cv::Mat& img, std::string* text, float* rec_score); /** \brief BatchPredict the input image and get OCR recognition model result. * * \param[in] images The list of input image data, comes from cv::imread(), is a 3-D array with layout HWC, BGR format. From f3c5d4ad763f9e28783bebc74aa5b4b8bb75de3e Mon Sep 17 00:00:00 2001 From: chenjian Date: Fri, 9 Dec 2022 10:04:38 +0800 Subject: [PATCH 03/77] [Doc] add fastdeploy client doc (#803) * add fastdeploy client doc * update doc --- serving/README_CN.md | 1 + serving/docs/zh_CN/client.md | 479 +++++++++++++++++++++++++++++++++++ 2 files changed, 480 insertions(+) create mode 100644 serving/docs/zh_CN/client.md diff --git a/serving/README_CN.md b/serving/README_CN.md index 84017b399..2c858b6f7 100644 --- a/serving/README_CN.md +++ b/serving/README_CN.md @@ -33,6 +33,7 @@ docker pull paddlepaddle/fastdeploy:1.0.0-gpu-cuda11.4-trt8.4-21.10 - [模型仓库目录说明](docs/zh_CN/model_repository.md) (说明如何准备模型仓库目录) - [模型配置说明](docs/zh_CN/model_configuration.md) (说明runtime的配置选项) - [服务化部署示例](docs/zh_CN/demo.md) (服务化部署示例) +- [客户端访问说明](docs/zh_CN/client.md) (客户端访问说明) ### 服务化部署示例 diff --git a/serving/docs/zh_CN/client.md b/serving/docs/zh_CN/client.md new file mode 100644 index 000000000..2ca376591 --- /dev/null +++ b/serving/docs/zh_CN/client.md @@ -0,0 +1,479 @@ +# 客户端访问说明 +本文以访问使用fastdeployserver部署的yolov5模型为例,讲述客户端如何请求服务端进行推理服务。关于如何使用fastdeployserver部署yolov5模型,可以参考文档[yolov5服务化部署](../../../examples/vision/detection/yolov5/serving) + +## 基本原理介绍 +fastdeployserver实现了由[kserve](https://github.com/kserve/kserve)提出的为机器学习模型推理服务而设计的[Predict Protocol协议](https://github.com/kserve/kserve/blob/master/docs/predict-api/v2/required_api.md) API,该API既简单易用同时又支持高性能部署的使用场景,目前提供基于HTTP和GRPC两种网络协议的访问方式。 + + +当fastdeployserver启动后,默认情况下,8000端口用于响应HTTP请求,8001端口用于响应GRPC请求。用户需要请求的资源通常有两种: + +### **模型的元信息(metadata)** + +**HTTP** + +访问方式: GET `v2/models/${MODEL_NAME}[/versions/${MODEL_VERSION}]` + +使用GET请求该url路径可以获取参与服务的模型的元信息,其中`${MODEL_NAME}`表示模型的名字,${MODEL_VERSION}表示模型的版本。服务器会把模型的元信息以json格式返回,返回的格式为一个字典,以$metadata_model_response表示返回的对象,各字段和内容形式表示如下: + +```json +$metadata_model_response = + { + "name" : $string, + "versions" : [ $string, ... ] #optional, + "platform" : $string, + "inputs" : [ $metadata_tensor, ... ], + "outputs" : [ $metadata_tensor, ... ] + } + +$metadata_tensor = + { + "name" : $string, + "datatype" : $string, + "shape" : [ $number, ... 
] + } +``` + +**GRPC** + +模型服务的GRPC定义为 + +```text +service GRPCInferenceService +{ + // Check liveness of the inference server. + rpc ServerLive(ServerLiveRequest) returns (ServerLiveResponse) {} + + // Check readiness of the inference server. + rpc ServerReady(ServerReadyRequest) returns (ServerReadyResponse) {} + + // Check readiness of a model in the inference server. + rpc ModelReady(ModelReadyRequest) returns (ModelReadyResponse) {} + + // Get server metadata. + rpc ServerMetadata(ServerMetadataRequest) returns (ServerMetadataResponse) {} + + // Get model metadata. + rpc ModelMetadata(ModelMetadataRequest) returns (ModelMetadataResponse) {} + + // Perform inference using a specific model. + rpc ModelInfer(ModelInferRequest) returns (ModelInferResponse) {} +} +``` + +访问方式:使用GRPC客户端调用模型服务GRPC接口中定义的ModelMetadata方法。 + +接口中请求的ModelMetadataRequest message和返回的ServerMetadataResponse message结构如下,可以看到和上面的HTTP里使用的json结构基本相同。 + +```text +message ModelMetadataRequest +{ + // The name of the model. + string name = 1; + + // The version of the model to check for readiness. If not given the + // server will choose a version based on the model and internal policy. + string version = 2; +} + +message ModelMetadataResponse +{ + // Metadata for a tensor. + message TensorMetadata + { + // The tensor name. + string name = 1; + + // The tensor data type. + string datatype = 2; + + // The tensor shape. A variable-size dimension is represented + // by a -1 value. + repeated int64 shape = 3; + } + + // The model name. + string name = 1; + + // The versions of the model available on the server. + repeated string versions = 2; + + // The model's platform. See Platforms. + string platform = 3; + + // The model's inputs. + repeated TensorMetadata inputs = 4; + + // The model's outputs. + repeated TensorMetadata outputs = 5; +} +``` + + +### **推理服务** + +**HTTP** + +访问方式:POST `v2/models/${MODEL_NAME}[/versions/${MODEL_VERSION}]/infer` + +使用POST请求该url路径可以请求模型的推理服务,获取推理结果。POST请求中的数据同样以json格式上传,以$inference_request表示上传的对象,各字段和内容形式表示如下: +```json + $inference_request = + { + "id" : $string #optional, + "parameters" : $parameters #optional, + "inputs" : [ $request_input, ... ], + "outputs" : [ $request_output, ... ] #optional + } + +$request_input = + { + "name" : $string, + "shape" : [ $number, ... ], + "datatype" : $string, + "parameters" : $parameters #optional, + "data" : $tensor_data + } + +$request_output = + { + "name" : $string, + "parameters" : $parameters #optional, + } + +$parameters = +{ + $parameter, ... +} + +$parameter = $string : $string | $number | $boolean +``` +其中$tensor_data表示一维或多维数组,如果是一维数据,必须按照行主序的方式进行排列tensor中的数据。 +服务器推理完成后,返回结果数据,以$inference_response表示返回的对象,各字段和内容形式表示如下: + +```json +$inference_response = + { + "model_name" : $string, + "model_version" : $string #optional, + "id" : $string, + "parameters" : $parameters #optional, + "outputs" : [ $response_output, ... ] + } + +$response_output = + { + "name" : $string, + "shape" : [ $number, ... ], + "datatype" : $string, + "parameters" : $parameters #optional, + "data" : $tensor_data + } +``` + +**GRPC** + +访问方式:使用GRPC客户端调用模型服务GRPC接口中定义的ModelInfer方法。 + +接口中请求的ModelInferRequest message和返回的ModelInferResponse message结构如下,更完整的结构定义可以参考kserve Predict Protocol [GRPC部分](https://github.com/kserve/kserve/blob/master/docs/predict-api/v2/required_api.md#grpc) + +```text +message ModelInferRequest +{ + // An input tensor for an inference request. + message InferInputTensor + { + // The tensor name. + string name = 1; + + // The tensor data type. 
+ string datatype = 2; + + // The tensor shape. + repeated int64 shape = 3; + + // Optional inference input tensor parameters. + map parameters = 4; + + // The tensor contents using a data-type format. This field must + // not be specified if "raw" tensor contents are being used for + // the inference request. + InferTensorContents contents = 5; + } + + // An output tensor requested for an inference request. + message InferRequestedOutputTensor + { + // The tensor name. + string name = 1; + + // Optional requested output tensor parameters. + map parameters = 2; + } + + // The name of the model to use for inferencing. + string model_name = 1; + + // The version of the model to use for inference. If not given the + // server will choose a version based on the model and internal policy. + string model_version = 2; + + // Optional identifier for the request. If specified will be + // returned in the response. + string id = 3; + + // Optional inference parameters. + map parameters = 4; + + // The input tensors for the inference. + repeated InferInputTensor inputs = 5; + + // The requested output tensors for the inference. Optional, if not + // specified all outputs produced by the model will be returned. + repeated InferRequestedOutputTensor outputs = 6; + + // The data contained in an input tensor can be represented in "raw" + // bytes form or in the repeated type that matches the tensor's data + // type. To use the raw representation 'raw_input_contents' must be + // initialized with data for each tensor in the same order as + // 'inputs'. For each tensor, the size of this content must match + // what is expected by the tensor's shape and data type. The raw + // data must be the flattened, one-dimensional, row-major order of + // the tensor elements without any stride or padding between the + // elements. Note that the FP16 and BF16 data types must be represented as + // raw content as there is no specific data type for a 16-bit float type. + // + // If this field is specified then InferInputTensor::contents must + // not be specified for any input tensor. + repeated bytes raw_input_contents = 7; +} + +message ModelInferResponse +{ + // An output tensor returned for an inference request. + message InferOutputTensor + { + // The tensor name. + string name = 1; + + // The tensor data type. + string datatype = 2; + + // The tensor shape. + repeated int64 shape = 3; + + // Optional output tensor parameters. + map parameters = 4; + + // The tensor contents using a data-type format. This field must + // not be specified if "raw" tensor contents are being used for + // the inference response. + InferTensorContents contents = 5; + } + + // The name of the model used for inference. + string model_name = 1; + + // The version of the model used for inference. + string model_version = 2; + + // The id of the inference request if one was specified. + string id = 3; + + // Optional inference response parameters. + map parameters = 4; + + // The output tensors holding inference results. + repeated InferOutputTensor outputs = 5; + + // The data contained in an output tensor can be represented in + // "raw" bytes form or in the repeated type that matches the + // tensor's data type. To use the raw representation 'raw_output_contents' + // must be initialized with data for each tensor in the same order as + // 'outputs'. For each tensor, the size of this content must match + // what is expected by the tensor's shape and data type. 
The raw + // data must be the flattened, one-dimensional, row-major order of + // the tensor elements without any stride or padding between the + // elements. Note that the FP16 and BF16 data types must be represented as + // raw content as there is no specific data type for a 16-bit float type. + // + // If this field is specified then InferOutputTensor::contents must + // not be specified for any output tensor. + repeated bytes raw_output_contents = 6; +} +``` + + +## 客户端工具 + +了解了fastdeployserver服务提供的接口之后,用户可以HTTP客户端工具来请求HTTP服务器,或者是使用GRPC客户端工具请求GRPC服务器。默认情况下,fastdeployserver启动后,8000端口用于响应HTTP请求,8001端口用于响应GRPC请求。 + +### 使用HTTP客户端 + +这里分别介绍如何使用tritonclient和requests库来访问fastdeployserver的HTTP服务,第一种工具是专门为模型服务做的客户端,对请求和响应进行了封装,方便用户使用。而第二种工具通用的http客户端工具,使用该工具进行访问可以帮助用户更好地理解上述原理描述中的数据结构。 + +一. 使用tritonclient访问服务 + +安装tritonclient\[http\] + +```bash +pip install tritonclient[http] +``` + +1.获取yolov5的模型元数据 +```python +import tritonclient.http as httpclient # 导入httpclient +server_addr = 'localhost:8000' # 这里写fastdeployserver服务器的实际地址 +client = httpclient.InferenceServerClient(server_addr) # 创建client +model_metadata = client.get_model_metadata( + model_name='yolov5', model_version='1') # 请求yolov5模型的元数据 +``` +可以打印看一下模型的输入和输出有哪些 +```python +print(model_metadata.inputs) +``` + +```text +[{'name': 'INPUT', 'datatype': 'UINT8', 'shape': [-1, -1, -1, 3]}] +``` + +```python +print(model_metadata.outputs) +``` + +```text +[{'name': 'detction_result', 'datatype': 'BYTES', 'shape': [-1, -1]}] +``` + +2.请求推理服务 + +根据模型的inputs和outputs构造数据,然后请求推理 + +```python +# 假设图像数据的文件名为000000014439.jpg +import cv2 +image = cv2.imread('000000014439.jpg') +image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)[None] + +inputs = [] +infer_input = httpclient.InferInput('INPUT', image.shape, 'UINT8') # 构造输入 +infer_input.set_data_from_numpy(image) # 载入输入数据 +inputs.append(infer_input) +outputs = [] +infer_output = httpclient.InferRequestedOutput('detction_result') # 构造输出 +outputs.append(infer_output) +response = client.infer( + 'yolov5', inputs, model_version='1', outputs=outputs) # 请求推理 +response_outputs = response.as_numpy('detction_result') # 根据输出变量名获取结果 +``` + +二. 
使用requests访问服务 + +安装requests +```bash +pip install requests +``` +1.获取yolov5的模型元数据 + +```python +import requests +url = 'http://localhost:8000/v2/models/yolov5/versions/1' # 根据上述章节中"模型的元信息"的获取接口构造url +response = requests.get(url) +response = response.json() # 返回数据为json,以json格式解析 +``` +打印一下返回的模型元数据 +```python +print(response) +``` +```text +{'name': 'yolov5', 'versions': ['1'], 'platform': 'ensemble', 'inputs': [{'name': 'INPUT', 'datatype': 'UINT8', 'shape': [-1, -1, -1, 3]}], 'outputs': [{'name': 'detction_result', 'datatype': 'BYTES', 'shape': [-1, -1]}]} +``` +2.请求推理服务 + +根据模型的inputs和outputs构造数据,然后请求推理。 +```python +url = 'http://localhost:8000/v2/models/yolov5/versions/1/infer' # 根据上述章节中"推理服务"的接口构造url +# 假设图像数据的文件名为000000014439.jpg +import cv2 +image = cv2.imread('000000014439.jpg') +image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)[None] + +payload = { + "inputs" : [ + { + "name" : "INPUT", + "shape" : image.shape, + "datatype" : "UINT8", + "data" : image.tolist() + } + ], + "outputs" : [ + { + "name" : "detction_result" + } + ] +} +response = requests.post(url, data=json.dumps(payload)) +response = response.json() # 返回数据为json,以json格式解析后即为推理后返回的结果 +``` + +### 使用GRPC客户端 + +安装tritonclient\[grpc\] +```bash +pip install tritonclient[grpc] +``` +tritonclient\[grpc\]提供了使用GRPC的客户端,并且对GRPC的交互进行了封装,使得用户不用手动和服务端建立连接,也不用去直接使用grpc的stub去调用服务器的接口,而是封装后给用户提供了和tritonclient HTTP客户端一样的接口进行使用。 + +1.获取yolov5的模型元数据 +```python +import tritonclient.grpc as grpcclient # 导入grpc客户端 +server_addr = 'localhost:8001' # 这里写fastdeployserver grpc服务器的实际地址 +client = grpcclient.InferenceServerClient(server_addr) # 创建client +model_metadata = client.get_model_metadata( + model_name='yolov5', model_version='1') # 请求yolov5模型的元数据 +``` +2.请求推理服务 +根据返回的model_metadata来构造请求数据。首先看一下模型的输入和输出有哪些 +```python +print(model_metadata.inputs) +``` +```text +[name: "INPUT" +datatype: "UINT8" +shape: -1 +shape: -1 +shape: -1 +shape: 3 +] +``` + +```python +print(model_metadata.outputs) +``` + +```text +[name: "detction_result" +datatype: "BYTES" +shape: -1 +shape: -1 +] +``` + +根据模型的inputs和outputs构造数据,然后请求推理 +```python +# 假设图像数据的文件名为000000014439.jpg +import cv2 +image = cv2.imread('000000014439.jpg') +image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)[None] + +inputs = [] +infer_input = grpcclient.InferInput('INPUT', image.shape, 'UINT8') # 构造输入 +infer_input.set_data_from_numpy(image) # 载入输入数据 +inputs.append(infer_input) +outputs = [] +infer_output = grpcclient.InferRequestedOutput('detction_result') # 构造输出 +outputs.append(infer_output) +response = client.infer( + 'yolov5', inputs, model_version='1', outputs=outputs) # 请求推理 +response_outputs = response.as_numpy('detction_result') # 根据输出变量名获取结果 +``` From 788ca79e5f2574745735cbae274c1d24abf6b79b Mon Sep 17 00:00:00 2001 From: Zeref996 <53218160+Zeref996@users.noreply.github.com> Date: Fri, 9 Dec 2022 10:50:37 +0800 Subject: [PATCH 04/77] Fix doc version (#841) * Change FastDeploy Doc Version from 1.0.0 to 1.0.1 * fix android doc version * fix android doc version 1 --- .../download_prebuilt_libraries.md | 18 +++++++-------- .../download_prebuilt_libraries.md | 22 +++++++++---------- 2 files changed, 20 insertions(+), 20 deletions(-) diff --git a/docs/cn/build_and_install/download_prebuilt_libraries.md b/docs/cn/build_and_install/download_prebuilt_libraries.md index 2f48c2c06..1a2c4f94e 100755 --- a/docs/cn/build_and_install/download_prebuilt_libraries.md +++ b/docs/cn/build_and_install/download_prebuilt_libraries.md @@ -20,7 +20,7 @@ FastDeploy提供各平台预编译库,供开发者直接下载安装使用。 ### Python安装 
-Release版本(当前最新1.0.0)安装 +Release版本(当前最新1.0.1)安装 ```bash pip install fastdeploy-gpu-python -f https://www.paddlepaddle.org.cn/whl/fastdeploy.html ``` @@ -41,8 +41,8 @@ Release版本 | 平台 | 文件 | 说明 | | :--- | :--- | :---- | -| Linux x64 | [fastdeploy-linux-x64-gpu-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-gpu-1.0.0.tgz) | g++ 8.2, CUDA 11.2, cuDNN 8.2编译产出 | -| Windows x64 | [fastdeploy-win-x64-gpu-1.0.0.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-gpu-1.0.0.zip) | Visual Studio 16 2019, CUDA 11.2, cuDNN 8.2编译产出 | +| Linux x64 | [fastdeploy-linux-x64-gpu-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-gpu-1.0.1.tgz) | g++ 8.2, CUDA 11.2, cuDNN 8.2编译产出 | +| Windows x64 | [fastdeploy-win-x64-gpu-1.0.1.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-gpu-1.0.1.zip) | Visual Studio 16 2019, CUDA 11.2, cuDNN 8.2编译产出 | Develop版本(Nightly build) @@ -63,7 +63,7 @@ Develop版本(Nightly build) ### Python安装 -Release版本(当前最新1.0.0)安装 +Release版本(当前最新1.0.1)安装 ```bash pip install fastdeploy-python -f https://www.paddlepaddle.org.cn/whl/fastdeploy.html ``` @@ -79,11 +79,11 @@ Release版本 | 平台 | 文件 | 说明 | | :--- | :--- | :---- | -| Linux x64 | [fastdeploy-linux-x64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-1.0.0.tgz) | g++ 8.2编译产出 | -| Windows x64 | [fastdeploy-win-x64-1.0.0.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-1.0.0.zip) | Visual Studio 16 2019编译产出 | -| Mac OSX x64 | [fastdeploy-osx-x86_64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-x86_64-1.0.0.tgz) | clang++ 10.0.0编译产出| -| Mac OSX arm64 | [fastdeploy-osx-arm64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-arm64-1.0.0.tgz) | clang++ 13.0.0编译产出 | -| Linux aarch64 | [fastdeploy-osx-arm64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-aarch64-1.0.0.tgz) | gcc 6.3编译产出 | +| Linux x64 | [fastdeploy-linux-x64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-1.0.1.tgz) | g++ 8.2编译产出 | +| Windows x64 | [fastdeploy-win-x64-1.0.1.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-1.0.1.zip) | Visual Studio 16 2019编译产出 | +| Mac OSX x64 | [fastdeploy-osx-x86_64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-x86_64-1.0.1.tgz) | clang++ 10.0.0编译产出| +| Mac OSX arm64 | [fastdeploy-osx-arm64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-arm64-1.0.1.tgz) | clang++ 13.0.0编译产出 | +| Linux aarch64 | [fastdeploy-osx-arm64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-aarch64-1.0.1.tgz) | gcc 6.3编译产出 | | Android armv7&v8 | [fastdeploy-android-1.0.0-shared.tgz](https://bj.bcebos.com/fastdeploy/release/android/fastdeploy-android-1.0.0-shared.tgz) | NDK 25及clang++编译产出, 支持arm64-v8a及armeabi-v7a | ## Java SDK安装 diff --git a/docs/en/build_and_install/download_prebuilt_libraries.md b/docs/en/build_and_install/download_prebuilt_libraries.md index 52dbdd627..37b199ba0 100644 --- a/docs/en/build_and_install/download_prebuilt_libraries.md +++ b/docs/en/build_and_install/download_prebuilt_libraries.md @@ -22,7 +22,7 @@ FastDeploy supports Computer Vision, Text and NLP model deployment on CPU and Nv ### Python SDK -Install the released version(the newest 1.0.0 for now) +Install the released version(the newest 1.0.1 for now) ``` pip install fastdeploy-gpu-python -f https://www.paddlepaddle.org.cn/whl/fastdeploy.html @@ -42,12 +42,12 @@ 
conda config --add channels conda-forge && conda install cudatoolkit=11.2 cudnn= ### C++ SDK -Install the released version(Latest 1.0.0) +Install the released version(Latest 1.0.1) | Platform | File | Description | |:----------- |:--------------------------------------------------------------------------------------------------------------------- |:--------------------------------------------------------- | -| Linux x64 | [fastdeploy-linux-x64-gpu-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-gpu-1.0.0.tgz) | g++ 8.2, CUDA 11.2, cuDNN 8.2 | -| Windows x64 | [fastdeploy-win-x64-gpu-1.0.0.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-gpu-1.0.0.zip) | Visual Studio 16 2019, CUDA 11.2, cuDNN 8.2 | +| Linux x64 | [fastdeploy-linux-x64-gpu-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-gpu-1.0.1.tgz) | g++ 8.2, CUDA 11.2, cuDNN 8.2 | +| Windows x64 | [fastdeploy-win-x64-gpu-1.0.1.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-gpu-1.0.1.zip) | Visual Studio 16 2019, CUDA 11.2, cuDNN 8.2 | Install the Develop version(Nightly build) @@ -69,7 +69,7 @@ FastDeploy supports computer vision, text and NLP model deployment on CPU with P ### Python SDK -Install the released version(Latest 1.0.0 for now) +Install the released version(Latest 1.0.1 for now) ``` pip install fastdeploy-python -f https://www.paddlepaddle.org.cn/whl/fastdeploy.html @@ -83,15 +83,15 @@ pip install fastdeploy-python==0.0.0 -f https://www.paddlepaddle.org.cn/whl/fast ### C++ SDK -Install the released version(Latest 1.0.0 for now, Android is 1.0.0) +Install the released version(Latest 1.0.1 for now, Android is 1.0.1) | Platform | File | Description | |:------------- |:--------------------------------------------------------------------------------------------------------------------- |:------------------------------ | -| Linux x64 | [fastdeploy-linux-x64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-1.0.0.tgz) | g++ 8.2 | -| Windows x64 | [fastdeploy-win-x64-1.0.0.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-1.0.0.zip) | Visual Studio 16 2019 | -| Mac OSX x64 | [fastdeploy-osx-x86_64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-x86_64-1.0.0.tgz) | clang++ 10.0.0| -| Mac OSX arm64 | [fastdeploy-osx-arm64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-arm64-1.0.0.tgz) | clang++ 13.0.0 | -| Linux aarch64 | [fastdeploy-osx-arm64-1.0.0.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-aarch64-1.0.0.tgz) | gcc 6.3 | +| Linux x64 | [fastdeploy-linux-x64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-x64-1.0.1.tgz) | g++ 8.2 | +| Windows x64 | [fastdeploy-win-x64-1.0.1.zip](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-win-x64-1.0.1.zip) | Visual Studio 16 2019 | +| Mac OSX x64 | [fastdeploy-osx-x86_64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-x86_64-1.0.1.tgz) | clang++ 10.0.0| +| Mac OSX arm64 | [fastdeploy-osx-arm64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-osx-arm64-1.0.1.tgz) | clang++ 13.0.0 | +| Linux aarch64 | [fastdeploy-osx-arm64-1.0.1.tgz](https://bj.bcebos.com/fastdeploy/release/cpp/fastdeploy-linux-aarch64-1.0.1.tgz) | gcc 6.3 | | Android armv7&v8 | [fastdeploy-android-1.0.0-shared.tgz](https://bj.bcebos.com/fastdeploy/release/android/fastdeploy-android-1.0.0-shared.tgz)| NDK 25, clang++, support 
arm64-v8a及armeabi-v7a | ## Java SDK From b0988bf423ec96d9da203bec6773adefae2e1f4c Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 11:41:19 +0800 Subject: [PATCH 05/77] [Compile] Support custom paddle inference (#839) * Support custom paddle inference * update setup.py --- cmake/paddle_inference.cmake | 93 +++++++++++++++++++++--------------- python/setup.py | 2 + 2 files changed, 56 insertions(+), 39 deletions(-) diff --git a/cmake/paddle_inference.cmake b/cmake/paddle_inference.cmake index f1b5ee6c7..3ab45454a 100644 --- a/cmake/paddle_inference.cmake +++ b/cmake/paddle_inference.cmake @@ -13,6 +13,8 @@ # limitations under the License. include(ExternalProject) +option(PADDLEINFERENCE_DIRECTORY "Directory of Paddle Inference library" OFF) + set(PADDLEINFERENCE_PROJECT "extern_paddle_inference") set(PADDLEINFERENCE_PREFIX_DIR ${THIRD_PARTY_PATH}/paddle_inference) set(PADDLEINFERENCE_SOURCE_DIR @@ -27,6 +29,10 @@ set(PADDLEINFERENCE_LIB_DIR set(CMAKE_BUILD_RPATH "${CMAKE_BUILD_RPATH}" "${PADDLEINFERENCE_LIB_DIR}") +if(PADDLEINFERENCE_DIRECTORY) + set(PADDLEINFERENCE_INC_DIR ${PADDLEINFERENCE_DIRECTORY}/paddle/include) +endif() + include_directories(${PADDLEINFERENCE_INC_DIR}) if(WIN32) set(PADDLEINFERENCE_COMPILE_LIB @@ -47,50 +53,59 @@ else() endif(WIN32) -set(PADDLEINFERENCE_URL_BASE "https://bj.bcebos.com/fastdeploy/third_libs/") -set(PADDLEINFERENCE_VERSION "2.4-dev3") -if(WIN32) - if (WITH_GPU) - set(PADDLEINFERENCE_FILE "paddle_inference-win-x64-gpu-trt-${PADDLEINFERENCE_VERSION}.zip") - else() - set(PADDLEINFERENCE_FILE "paddle_inference-win-x64-${PADDLEINFERENCE_VERSION}.zip") - endif() -elseif(APPLE) - if(CURRENT_OSX_ARCH MATCHES "arm64") - message(FATAL_ERROR "Paddle Backend doesn't support Mac OSX with Arm64 now.") - set(PADDLEINFERENCE_FILE "paddle_inference-osx-arm64-${PADDLEINFERENCE_VERSION}.tgz") - else() - set(PADDLEINFERENCE_FILE "paddle_inference-osx-x86_64-${PADDLEINFERENCE_VERSION}.tgz") +if(PADDLEINFERENCE_DIRECTORY) + if(EXISTS "${THIRD_PARTY_PATH}/install/paddle_inference") + file(REMOVE_RECURSE "${THIRD_PARTY_PATH}/install/paddle_inference") endif() + find_package(Python COMPONENTS Interpreter Development REQUIRED) + message(STATUS "Copying ${PADDLEINFERENCE_DIRECTORY} to ${THIRD_PARTY_PATH}/install/paddle_inference ...") + execute_process(COMMAND ${Python_EXECUTABLE} ${PROJECT_SOURCE_DIR}/scripts/copy_directory.py ${PADDLEINFERENCE_DIRECTORY} ${THIRD_PARTY_PATH}/install/paddle_inference) else() - if(CMAKE_HOST_SYSTEM_PROCESSOR MATCHES "aarch64") - message(FATAL_ERROR "Paddle Backend doesn't support linux aarch64 now.") - set(PADDLEINFERENCE_FILE "paddle_inference-linux-aarch64-${PADDLEINFERENCE_VERSION}.tgz") - else() - set(PADDLEINFERENCE_FILE "paddle_inference-linux-x64-${PADDLEINFERENCE_VERSION}.tgz") - if(WITH_GPU) - set(PADDLEINFERENCE_FILE "paddle_inference-linux-x64-gpu-trt-${PADDLEINFERENCE_VERSION}.tgz") + set(PADDLEINFERENCE_URL_BASE "https://bj.bcebos.com/fastdeploy/third_libs/") + set(PADDLEINFERENCE_VERSION "2.4-dev3") + if(WIN32) + if (WITH_GPU) + set(PADDLEINFERENCE_FILE "paddle_inference-win-x64-gpu-trt-${PADDLEINFERENCE_VERSION}.zip") + else() + set(PADDLEINFERENCE_FILE "paddle_inference-win-x64-${PADDLEINFERENCE_VERSION}.zip") endif() - if (WITH_IPU) - set(PADDLEINFERENCE_VERSION "2.4-dev1") - set(PADDLEINFERENCE_FILE "paddle_inference-linux-x64-ipu-${PADDLEINFERENCE_VERSION}.tgz") + elseif(APPLE) + if(CURRENT_OSX_ARCH MATCHES "arm64") + message(FATAL_ERROR "Paddle Backend doesn't support Mac OSX with Arm64 now.") + 
set(PADDLEINFERENCE_FILE "paddle_inference-osx-arm64-${PADDLEINFERENCE_VERSION}.tgz") + else() + set(PADDLEINFERENCE_FILE "paddle_inference-osx-x86_64-${PADDLEINFERENCE_VERSION}.tgz") + endif() + else() + if(CMAKE_HOST_SYSTEM_PROCESSOR MATCHES "aarch64") + message(FATAL_ERROR "Paddle Backend doesn't support linux aarch64 now.") + set(PADDLEINFERENCE_FILE "paddle_inference-linux-aarch64-${PADDLEINFERENCE_VERSION}.tgz") + else() + set(PADDLEINFERENCE_FILE "paddle_inference-linux-x64-${PADDLEINFERENCE_VERSION}.tgz") + if(WITH_GPU) + set(PADDLEINFERENCE_FILE "paddle_inference-linux-x64-gpu-trt-${PADDLEINFERENCE_VERSION}.tgz") + endif() + if (WITH_IPU) + set(PADDLEINFERENCE_VERSION "2.4-dev1") + set(PADDLEINFERENCE_FILE "paddle_inference-linux-x64-ipu-${PADDLEINFERENCE_VERSION}.tgz") + endif() endif() endif() -endif() -set(PADDLEINFERENCE_URL "${PADDLEINFERENCE_URL_BASE}${PADDLEINFERENCE_FILE}") - -ExternalProject_Add( - ${PADDLEINFERENCE_PROJECT} - ${EXTERNAL_PROJECT_LOG_ARGS} - URL ${PADDLEINFERENCE_URL} - PREFIX ${PADDLEINFERENCE_PREFIX_DIR} - DOWNLOAD_NO_PROGRESS 1 - CONFIGURE_COMMAND "" - BUILD_COMMAND "" - UPDATE_COMMAND "" - INSTALL_COMMAND - ${CMAKE_COMMAND} -E copy_directory ${PADDLEINFERENCE_SOURCE_DIR} ${PADDLEINFERENCE_INSTALL_DIR} - BUILD_BYPRODUCTS ${PADDLEINFERENCE_COMPILE_LIB}) + set(PADDLEINFERENCE_URL "${PADDLEINFERENCE_URL_BASE}${PADDLEINFERENCE_FILE}") + + ExternalProject_Add( + ${PADDLEINFERENCE_PROJECT} + ${EXTERNAL_PROJECT_LOG_ARGS} + URL ${PADDLEINFERENCE_URL} + PREFIX ${PADDLEINFERENCE_PREFIX_DIR} + DOWNLOAD_NO_PROGRESS 1 + CONFIGURE_COMMAND "" + BUILD_COMMAND "" + UPDATE_COMMAND "" + INSTALL_COMMAND + ${CMAKE_COMMAND} -E copy_directory ${PADDLEINFERENCE_SOURCE_DIR} ${PADDLEINFERENCE_INSTALL_DIR} + BUILD_BYPRODUCTS ${PADDLEINFERENCE_COMPILE_LIB}) +endif(PADDLEINFERENCE_DIRECTORY) if(UNIX AND (NOT APPLE) AND (NOT ANDROID)) add_custom_target(patchelf_paddle_inference ALL COMMAND bash -c "PATCHELF_EXE=${PATCHELF_EXE} python ${PROJECT_SOURCE_DIR}/scripts/patch_paddle_inference.py ${PADDLEINFERENCE_INSTALL_DIR}/paddle/lib/libpaddle_inference.so" DEPENDS ${LIBRARY_NAME}) diff --git a/python/setup.py b/python/setup.py index 1f01322bb..b4dc111c6 100755 --- a/python/setup.py +++ b/python/setup.py @@ -78,6 +78,8 @@ setup_configs["LIBRARY_NAME"] = PACKAGE_NAME setup_configs["PY_LIBRARY_NAME"] = PACKAGE_NAME + "_main" setup_configs["OPENCV_DIRECTORY"] = os.getenv("OPENCV_DIRECTORY", "") setup_configs["ORT_DIRECTORY"] = os.getenv("ORT_DIRECTORY", "") +setup_configs["PADDLEINFERENCE_DIRECTORY"] = os.getenv("PADDLEINFERENCE_DIRECTORY", "") + setup_configs["RKNN2_TARGET_SOC"] = os.getenv("RKNN2_TARGET_SOC", "") if setup_configs["RKNN2_TARGET_SOC"] != "" or setup_configs["BUILD_ON_JETSON"] != "OFF": REQUIRED_PACKAGES = REQUIRED_PACKAGES.replace("opencv-python", "") From 3c05c745136bf9947d005de322e488552a7bc163 Mon Sep 17 00:00:00 2001 From: shentanyue <34421038+shentanyue@users.noreply.github.com> Date: Fri, 9 Dec 2022 13:20:33 +0800 Subject: [PATCH 06/77] [Paddle Lite] Support stable-diffusion model (#830) * support stable-diffusion model for paddlelite * update code --- fastdeploy/backends/lite/lite_backend.cc | 10 +++++----- fastdeploy/pybind/main.cc.in | 6 +++++- fastdeploy/pybind/main.h | 6 ++++-- 3 files changed, 14 insertions(+), 8 deletions(-) diff --git a/fastdeploy/backends/lite/lite_backend.cc b/fastdeploy/backends/lite/lite_backend.cc index 04f139256..7e3e09f8d 100755 --- a/fastdeploy/backends/lite/lite_backend.cc +++ b/fastdeploy/backends/lite/lite_backend.cc @@ -206,24 
+206,24 @@ bool LiteBackend::Infer(std::vector& inputs, // Adjust dims only, allocate lazy. tensor->Resize(inputs[i].shape); if (inputs[i].dtype == FDDataType::FP32) { - tensor->CopyFromCpu( + tensor->CopyFromCpu( reinterpret_cast(const_cast( inputs[i].CpuData()))); } else if (inputs[i].dtype == FDDataType::INT32) { - tensor->CopyFromCpu( + tensor->CopyFromCpu( reinterpret_cast(const_cast( inputs[i].CpuData()))); } else if (inputs[i].dtype == FDDataType::INT8) { - tensor->CopyFromCpu( + tensor->CopyFromCpu( reinterpret_cast(const_cast( inputs[i].CpuData()))); } else if (inputs[i].dtype == FDDataType::UINT8) { - tensor->CopyFromCpu( + tensor->CopyFromCpu( reinterpret_cast(const_cast( inputs[i].CpuData()))); } else if (inputs[i].dtype == FDDataType::INT64) { #ifdef __aarch64__ - tensor->CopyFromCpu( + tensor->CopyFromCpu( reinterpret_cast(const_cast( inputs[i].CpuData()))); #else diff --git a/fastdeploy/pybind/main.cc.in b/fastdeploy/pybind/main.cc.in index 97aafc64a..1b227edc6 100644 --- a/fastdeploy/pybind/main.cc.in +++ b/fastdeploy/pybind/main.cc.in @@ -35,6 +35,8 @@ pybind11::dtype FDDataTypeToNumpyDataType(const FDDataType& fd_dtype) { dt = pybind11::dtype::of(); } else if (fd_dtype == FDDataType::UINT8) { dt = pybind11::dtype::of(); + } else if (fd_dtype == FDDataType::INT8) { + dt = pybind11::dtype::of(); } else if (fd_dtype == FDDataType::FP16) { dt = pybind11::dtype::of(); } else { @@ -55,12 +57,14 @@ FDDataType NumpyDataTypeToFDDataType(const pybind11::dtype& np_dtype) { return FDDataType::FP64; } else if (np_dtype.is(pybind11::dtype::of())) { return FDDataType::UINT8; + } else if (np_dtype.is(pybind11::dtype::of())) { + return FDDataType::INT8; } else if (np_dtype.is(pybind11::dtype::of())) { return FDDataType::FP16; } FDASSERT(false, "NumpyDataTypeToFDDataType() only support " - "int32/int64/float32/float64/float16 now."); + "int8/int32/int64/float32/float64/float16 now."); return FDDataType::FP32; } diff --git a/fastdeploy/pybind/main.h b/fastdeploy/pybind/main.h index 471579ab1..c0ea4497a 100644 --- a/fastdeploy/pybind/main.h +++ b/fastdeploy/pybind/main.h @@ -67,9 +67,11 @@ FDDataType CTypeToFDDataType() { return FDDataType::FP32; } else if (std::is_same::value) { return FDDataType::FP64; + } else if (std::is_same::value) { + return FDDataType::INT8; } - FDASSERT(false, - "CTypeToFDDataType only support int32/int64/float32/float64 now."); + FDASSERT(false, "CTypeToFDDataType only support " + "int8/int32/int64/float32/float64 now."); return FDDataType::FP32; } From b19fe6a965a2b0a86a1ae27bf97f916138548dac Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 14:28:00 +0800 Subject: [PATCH 07/77] Update cpu.md --- docs/cn/build_and_install/cpu.md | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/docs/cn/build_and_install/cpu.md b/docs/cn/build_and_install/cpu.md index c6fb2a893..b0057e677 100644 --- a/docs/cn/build_and_install/cpu.md +++ b/docs/cn/build_and_install/cpu.md @@ -27,6 +27,11 @@ Linux上编译需满足 - gcc/g++ >= 5.4(推荐8.2) - cmake >= 3.18.0 +此外更推荐开发者自行安装,编译时通过`-DOPENCV_DIRECTORY`来指定环境中的OpenCV(如若不指定-DOPENCV_DIRECTORY,会自动下载FastDeploy提供的预编译的OpenCV,但在**Linux平台**无法支持Video的读取,以及imshow等可视化界面功能) +``` +sudo apt-get install libopencv-dev +``` + ```bash git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy @@ -36,6 +41,7 @@ cmake .. 
-DENABLE_ORT_BACKEND=ON \
          -DENABLE_PADDLE_BACKEND=ON \
          -DENABLE_OPENVINO_BACKEND=ON \
          -DCMAKE_INSTALL_PREFIX=${PWD}/compiled_fastdeploy_sdk \
          -DENABLE_VISION=ON \
+         -DOPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4 \
          -DENABLE_TEXT=ON
 make -j12
 make install
@@ -90,6 +96,8 @@
 export ENABLE_PADDLE_BACKEND=ON
 export ENABLE_OPENVINO_BACKEND=ON
 export ENABLE_VISION=ON
 export ENABLE_TEXT=ON
+# OPENCV_DIRECTORY可选,不指定会自动下载FastDeploy提供的预编译OpenCV库
+export OPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4

 python setup.py build
 python setup.py bdist_wheel

From 4ccec075a14a3e1404e5bcd6bfc8335ad74431bf Mon Sep 17 00:00:00 2001
From: Jason
Date: Fri, 9 Dec 2022 14:29:44 +0800
Subject: [PATCH 08/77] Update gpu.md

---
 docs/cn/build_and_install/gpu.md | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/docs/cn/build_and_install/gpu.md b/docs/cn/build_and_install/gpu.md
index 3d6aba116..1e9a0d26f 100644
--- a/docs/cn/build_and_install/gpu.md
+++ b/docs/cn/build_and_install/gpu.md
@@ -33,6 +33,11 @@ Linux上编译需满足
 - cuda >= 11.2
 - cudnn >= 8.2

+此外更推荐开发者自行安装,编译时通过`-DOPENCV_DIRECTORY`来指定环境中的OpenCV(如若不指定-DOPENCV_DIRECTORY,会自动下载FastDeploy提供的预编译的OpenCV,但在**Linux平台**无法支持Video的读取,以及imshow等可视化界面功能)
+```
+sudo apt-get install libopencv-dev
+```
+
 ```bash
 git clone https://github.com/PaddlePaddle/FastDeploy.git
 cd FastDeploy
@@ -46,7 +51,7 @@ cmake .. -DENABLE_ORT_BACKEND=ON \
          -DCUDA_DIRECTORY=/usr/local/cuda \
          -DCMAKE_INSTALL_PREFIX=${PWD}/compiled_fastdeploy_sdk \
          -DENABLE_VISION=ON \
+         -DOPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4 \
          -DENABLE_TEXT=ON
 make -j12
 make install
@@ -115,6 +121,8 @@ export ENABLE_TRT_BACKEND=ON
 export WITH_GPU=ON
 export TRT_DIRECTORY=/Paddle/TensorRT-8.4.1.5
 export CUDA_DIRECTORY=/usr/local/cuda
+# OPENCV_DIRECTORY可选,不指定会在编译过程下载FastDeploy预编译的OpenCV库
+export OPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4

 python setup.py build
 python setup.py bdist_wheel

From 195132a1c70990a5488fd2eb077368bfea696782 Mon Sep 17 00:00:00 2001
From: DefTruth <31974251+DefTruth@users.noreply.github.com>
Date: Fri, 9 Dec 2022 15:53:26 +0800
Subject: [PATCH 09/77] [Android] Update Android build scripts & app download tasks (#835)

* [Android] Add ERNIE3.0 intent and slot task jni support

* [Bug Fix] fix app sdk download tasks

* [Bug Fix] fix app sdk download tasks

* [JNI] remove empty .cc files

* [Android] Update Android build scripts
---
 cmake/paddlelite.cmake                 |   4 +-
 java/android/app/build.gradle          |  24 ++--
 java/android/fastdeploy/build.gradle   |  10 +-
 scripts/android/build_android_aar.sh   |   9 +-
 scripts/android/build_android_app.sh   |   6 +-
 scripts/android/build_android_cpp.sh   |   2 +-
 .../build_android_cpp_with_text_api.sh | 118 ++++++++++++++++++
 7 files changed, 146 insertions(+), 27 deletions(-)
 create mode 100755 scripts/android/build_android_cpp_with_text_api.sh

diff --git a/cmake/paddlelite.cmake b/cmake/paddlelite.cmake
index 12a069f6e..299843a6d 100755
--- a/cmake/paddlelite.cmake
+++ b/cmake/paddlelite.cmake
@@ -52,9 +52,9 @@ endif()
 if(WIN32 OR APPLE OR IOS)
   message(FATAL_ERROR "Doesn't support windows/mac/ios platform with backend Paddle Lite now.")
 elseif(ANDROID)
-  set(PADDLELITE_URL "${PADDLELITE_URL_PREFIX}/lite-android-${ANDROID_ABI}-latest.tgz")
+  set(PADDLELITE_URL "${PADDLELITE_URL_PREFIX}/lite-android-${ANDROID_ABI}-latest-dev.tgz")
   if(ANDROID_ABI MATCHES "arm64-v8a")
-    set(PADDLELITE_URL "${PADDLELITE_URL_PREFIX}/lite-android-${ANDROID_ABI}-fp16-latest.tgz")
+    set(PADDLELITE_URL "${PADDLELITE_URL_PREFIX}/lite-android-${ANDROID_ABI}-fp16-latest-dev.tgz")
   endif()
 else() # Linux
if(CMAKE_HOST_SYSTEM_PROCESSOR MATCHES "aarch64") diff --git a/java/android/app/build.gradle b/java/android/app/build.gradle index d58cb3dd5..fde73b3b3 100644 --- a/java/android/app/build.gradle +++ b/java/android/app/build.gradle @@ -95,11 +95,13 @@ task downloadAndExtractModels(type: DefaultTask) { String[] modelPaths = model.src.split("/") String modelName = modelPaths[modelPaths.length - 1] String modelPrefix = modelName.substring(0, modelName.length() - 4) - // Download the target model if not exists - boolean copyFiles = !file("${model.dest}/${modelPrefix}").exists() - if (!file("${cachePath}/${modelName}").exists()) { - println "[INFO] Downloading ${model.src} -> ${cachePath}/${modelName}" - ant.get(src: model.src, dest: file("${cachePath}/${modelName}")) + boolean copyFiles = false + if (!file("${model.dest}/${modelPrefix}").exists()) { + // Download the target model if not exists + if (!file("${cachePath}/${modelName}").exists()) { + println "[INFO] Downloading ${model.src} -> ${cachePath}/${modelName}" + ant.get(src: model.src, dest: file("${cachePath}/${modelName}")) + } copyFiles = true } if (copyFiles) { @@ -127,11 +129,13 @@ task downloadAndExtractSDKs(type: DefaultTask) { FD_JAVA_SDK.eachWithIndex { sdk, index -> String[] sdkPaths = sdk.src.split("/") String sdkName = sdkPaths[sdkPaths.length - 1] - // Download the target SDK if not exists - boolean copyFiles = !file("${sdk.dest}/${sdkName}").exists() - if (!file("${cachePath}/${sdkName}").exists()) { - println "[INFO] Downloading ${sdk.src} -> ${cachePath}/${sdkName}" - ant.get(src: sdk.src, dest: file("${cachePath}/${sdkName}")) + boolean copyFiles = false + if (!file("${sdk.dest}/${sdkName}").exists()) { + // Download the target SDK if not exists + if (file("${cachePath}/${sdkName}").exists()) { + println "[INFO] Downloading ${sdk.src} -> ${cachePath}/${sdkName}" + ant.get(src: sdk.src, dest: file("${cachePath}/${sdkName}")) + } copyFiles = true } if (copyFiles) { diff --git a/java/android/fastdeploy/build.gradle b/java/android/fastdeploy/build.gradle index f16248440..d6d4abb7c 100644 --- a/java/android/fastdeploy/build.gradle +++ b/java/android/fastdeploy/build.gradle @@ -67,10 +67,12 @@ task downloadAndExtractLibs(type: DefaultTask) { String[] libPaths = lib.src.split("/") String libName = libPaths[libPaths.length - 1] libName = libName.split("\\.")[0] - boolean copyFiles = !file("${lib.dest}/${libName}").exists() - if (!file("${cachePath}/${libName}.tgz").exists()) { - println "[INFO] Downloading ${lib.src} -> ${cachePath}/${libName}.tgz" - ant.get(src: lib.src, dest: file("${cachePath}/${libName}.tgz")) + boolean copyFiles = false + if (!file("${lib.dest}/${libName}").exists()) { + if (!file("${cachePath}/${libName}.tgz").exists()) { + println "[INFO] Downloading ${lib.src} -> ${cachePath}/${libName}.tgz" + ant.get(src: lib.src, dest: file("${cachePath}/${libName}.tgz")) + } copyFiles = true } if (copyFiles) { diff --git a/scripts/android/build_android_aar.sh b/scripts/android/build_android_aar.sh index bc5a61760..f1e4178b7 100755 --- a/scripts/android/build_android_aar.sh +++ b/scripts/android/build_android_aar.sh @@ -2,20 +2,15 @@ set -e set +x -PACKAGE_VERSION=$1 FASTDEPLOY_DIR=$(pwd) BUILT_PACKAGE_DIR=build/Android -CXX_PACKAGE_PREFIX=fastdeploy-android-${PACKAGE_VERSION}-shared +CXX_PACKAGE_PREFIX=fastdeploy-android-latest-dev-shared CXX_PACKAGE_NAME=${BUILT_PACKAGE_DIR}/${CXX_PACKAGE_PREFIX} ARMV8_CXX_PACKAGE_NAME=${BUILT_PACKAGE_DIR}/arm64-v8a-api-21/install 
ARMV7_CXX_PACKAGE_NAME=${BUILT_PACKAGE_DIR}/armeabi-v7a-api-21/install # check package name echo "[INFO] --- FASTDEPLOY_DIR: ${FASTDEPLOY_DIR}" -if [ "$PACKAGE_VERSION" = "dev" ]; then - CXX_PACKAGE_PREFIX=fastdeploy-android-latest-shared-dev - CXX_PACKAGE_NAME=${BUILT_PACKAGE_DIR}/fastdeploy-android-latest-shared-dev -fi # check arm v7 & v8 c++ sdk if [ ! -d "${BUILT_PACKAGE_DIR}" ]; then @@ -76,4 +71,4 @@ echo "[INFO] --- Built java aar package!" ls -lh ${JNI_LIB_DIR}/build/outputs/aar/ # Usage: -# ./scripts/android/build_android_aar.sh dev +# ./scripts/android/build_android_aar.sh diff --git a/scripts/android/build_android_app.sh b/scripts/android/build_android_app.sh index 24db66fed..5df19148a 100755 --- a/scripts/android/build_android_app.sh +++ b/scripts/android/build_android_app.sh @@ -1,4 +1,4 @@ -# build java aar package +# build FastDeploy app FASTDEPLOY_DIR=$(pwd) JAVA_ANDROID_DIR=${FASTDEPLOY_DIR}/java/android JNI_LIB_DIR=${JAVA_ANDROID_DIR}/fastdeploy @@ -7,7 +7,7 @@ APP_DIR=${JAVA_ANDROID_DIR}/app APP_LIBS_DIR=${APP_DIR}/libs cd ${JAVA_ANDROID_DIR} -# check aar package +# check aar package first! echo "[INFO] --- JAVA_ANDROID_DIR: ${JAVA_ANDROID_DIR}" if [ ! -d "${JNI_LIB_DIR}/build/outputs/aar" ]; then echo "-- [ERROR] ${JNI_LIB_DIR} not exists, please build aar package first!" @@ -28,7 +28,7 @@ if [ -f "${APP_LIBS_DIR}/fastdeploy-android-sdk-latest-dev.aar" ]; then echo "[INFO] --- Update aar package done!" fi # build android app -echo "[INFO] --- Building FastDeploy Android app ..." +echo "[INFO] --- Building FastDeploy Android App ..." chmod +x gradlew ./gradlew app:assembleDebug echo "[INFO] --- Built FastDeploy Android app." diff --git a/scripts/android/build_android_cpp.sh b/scripts/android/build_android_cpp.sh index 7ca62330f..5179a5117 100755 --- a/scripts/android/build_android_cpp.sh +++ b/scripts/android/build_android_cpp.sh @@ -90,7 +90,7 @@ __build_fastdeploy_android_shared() { -DENABLE_LITE_BACKEND=ON \ -DENABLE_PADDLE_FRONTEND=OFF \ -DENABLE_FLYCV=ON \ - -DENABLE_TEXT=ON \ + -DENABLE_TEXT=OFF \ -DENABLE_VISION=ON \ -DENABLE_VISION_VISUALIZE=ON \ -DBUILD_EXAMPLES=ON \ diff --git a/scripts/android/build_android_cpp_with_text_api.sh b/scripts/android/build_android_cpp_with_text_api.sh new file mode 100755 index 000000000..ac1ca4e6f --- /dev/null +++ b/scripts/android/build_android_cpp_with_text_api.sh @@ -0,0 +1,118 @@ +#!/bin/bash +set -e +set +x + +# ------------------------------------------------------------------------------- +# mutable global variables +# ------------------------------------------------------------------------------- +TOOLCHAIN=clang # gcc/clang toolchain + +# ------------------------------------------------------------------------------- +# readonly global variables +# ------------------------------------------------------------------------------- +readonly ROOT_PATH=$(pwd) +readonly ANDROID_ABI=$1 +readonly ANDROID_PLATFORM="android-$2" +readonly BUILD_ROOT=build/Android +readonly BUILD_DIR=${BUILD_ROOT}/${ANDROID_ABI}-api-$2 + +# ------------------------------------------------------------------------------- +# tasks +# ------------------------------------------------------------------------------- +__make_build_dir() { + if [ ! -d "${BUILD_DIR}" ]; then + echo "-- [INFO] BUILD_DIR: ${BUILD_DIR} not exists, setup manually ..." + if [ ! -d "${BUILD_ROOT}" ]; then + mkdir -p "${BUILD_ROOT}" && echo "-- [INFO] Created ${BUILD_ROOT} !" + fi + mkdir -p "${BUILD_DIR}" && echo "-- [INFO] Created ${BUILD_DIR} !" 
+ else + echo "-- [INFO] Found BUILD_DIR: ${BUILD_DIR}" + fi +} + +__check_cxx_envs() { + if [ $LDFLAGS ]; then + echo "-- [INFO] Found LDFLAGS: ${LDFLAGS}, \c" + echo "unset it before cross-compiling ${ANDROID_ABI}" + unset LDFLAGS + fi + if [ $CPPFLAGS ]; then + echo "-- [INFO] Found CPPFLAGS: ${CPPFLAGS}, \c" + echo "unset it before cross-compiling ${ANDROID_ABI}" + unset CPPFLAGS + fi + if [ $CPLUS_INCLUDE_PATH ]; then + echo "-- [INFO] Found CPLUS_INCLUDE_PATH: ${CPLUS_INCLUDE_PATH}, \c" + echo "unset it before cross-compiling ${ANDROID_ABI}" + unset CPLUS_INCLUDE_PATH + fi + if [ $C_INCLUDE_PATH ]; then + echo "-- [INFO] Found C_INCLUDE_PATH: ${C_INCLUDE_PATH}, \c" + echo "unset it before cross-compiling ${ANDROID_ABI}" + unset C_INCLUDE_PATH + fi +} + +__set_android_ndk() { + if [ -z $ANDROID_NDK ]; then + echo "-- [INFO] ANDROID_NDK is not set, please set it up manually ..." + exit 0 + else + echo "-- [INFO] Found ANDROID_NDK: ${ANDROID_NDK}" + fi + if [ "$ANDROID_NDK" ]; then + NDK_VERSION=$(echo $ANDROID_NDK | egrep -o "[0-9]{2}" | head -n 1) + if [ "$NDK_VERSION" -gt 17 ]; then + TOOLCHAIN=clang + fi + echo "-- [INFO] Checked ndk version: ${NDK_VERSION}" + echo "-- [INFO] Selected toolchain: ${TOOLCHAIN}" + fi +} + +__build_fastdeploy_android_shared() { + + local ANDROID_STL=c++_shared # c++_static + local ANDROID_TOOLCHAIN=${TOOLCHAIN} + local TOOLCHAIN_FILE=${ANDROID_NDK}/build/cmake/android.toolchain.cmake + local FASDEPLOY_INSTALL_DIR="${ROOT_PATH}/${BUILD_DIR}/install" + cd "${BUILD_DIR}" && echo "-- [INFO] Working Dir: ${PWD}" + + cmake -DCMAKE_TOOLCHAIN_FILE=${TOOLCHAIN_FILE} \ + -DCMAKE_BUILD_TYPE=MinSizeRel \ + -DANDROID_ABI=${ANDROID_ABI} \ + -DANDROID_NDK=${ANDROID_NDK} \ + -DANDROID_PLATFORM=${ANDROID_PLATFORM} \ + -DANDROID_STL=${ANDROID_STL} \ + -DANDROID_TOOLCHAIN=${ANDROID_TOOLCHAIN} \ + -DENABLE_ORT_BACKEND=OFF \ + -DENABLE_LITE_BACKEND=ON \ + -DENABLE_PADDLE_FRONTEND=OFF \ + -DENABLE_FLYCV=ON \ + -DENABLE_TEXT=ON \ + -DENABLE_VISION=ON \ + -DENABLE_VISION_VISUALIZE=ON \ + -DBUILD_EXAMPLES=ON \ + -DWITH_OPENCV_STATIC=OFF \ + -DWITH_LITE_STATIC=OFF \ + -DWITH_OPENMP=OFF \ + -DCMAKE_INSTALL_PREFIX=${FASDEPLOY_INSTALL_DIR} \ + -Wno-dev ../../..
&& make -j8 && make install + + echo "-- [INFO][built][${ANDROID_ABI}][${BUILD_DIR}/install]" +} + +main() { + __make_build_dir + __check_cxx_envs + __set_android_ndk + __build_fastdeploy_android_shared + exit 0 +} + +main + +# Usage: +# ./scripts/android/build_android_cpp_with_text_api.sh arm64-v8a 21 +# ./scripts/android/build_android_cpp_with_text_api.sh armeabi-v7a 21 From 54a8fe0e88ee35e8080c5606e761bd901259790d Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 15:59:16 +0800 Subject: [PATCH 10/77] Update cpu.md --- docs/en/build_and_install/cpu.md | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/docs/en/build_and_install/cpu.md b/docs/en/build_and_install/cpu.md index f280cce69..bc01fb1f2 100644 --- a/docs/en/build_and_install/cpu.md +++ b/docs/en/build_and_install/cpu.md @@ -30,6 +30,11 @@ Prerequisite for Compiling on Linux & Mac: - gcc/g++ >= 5.4 (8.2 is recommended) - cmake >= 3.18.0 +It is recommended to install the OpenCV library manually and define `-DOPENCV_DIRECTORY` to set the path of the OpenCV library. (If the flag is not defined, a prebuilt OpenCV library will be downloaded automatically while building FastDeploy, but the prebuilt OpenCV does not support reading video files or other functions such as `imshow`.) +``` +sudo apt-get install libopencv-dev +``` + ``` git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy mkdir build && cd build cmake .. -DENABLE_ORT_BACKEND=ON \ -DENABLE_PADDLE_BACKEND=ON \ -DENABLE_OPENVINO_BACKEND=ON \ -DCMAKE_INSTALL_PREFIX=${PWD}/compiled_fastdeploy_sdk \ - -DENABLE_VISION=ON + -DENABLE_VISION=ON \ + -DOPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4 make -j12 make install ``` @@ -84,6 +90,11 @@ All compilation options are introduced via environment variables ### Linux & Mac +It is recommended to install the OpenCV library manually and set the environment variable `OPENCV_DIRECTORY` to the path of the OpenCV library. (If it is not set, a prebuilt OpenCV library will be downloaded automatically while building FastDeploy, but the prebuilt OpenCV does not support reading video files or other functions such as `imshow`.) +``` +sudo apt-get install libopencv-dev +``` + ``` git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy/python export ENABLE_ORT_BACKEND=ON export ENABLE_PADDLE_BACKEND=ON export ENABLE_OPENVINO_BACKEND=ON export ENABLE_VISION=ON +# OPENCV_DIRECTORY is optional; if not exported, a prebuilt OpenCV library will be downloaded +export OPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4 python setup.py build python setup.py bdist_wheel From ee144090057c728928b2ced0d888e36da3bbea5b Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 16:00:09 +0800 Subject: [PATCH 11/77] Update gpu.md --- docs/en/build_and_install/gpu.md | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/docs/en/build_and_install/gpu.md b/docs/en/build_and_install/gpu.md index 40357f118..df0645262 100644 --- a/docs/en/build_and_install/gpu.md +++ b/docs/en/build_and_install/gpu.md @@ -34,6 +34,11 @@ Prerequisite for Compiling on Linux: - cuda >= 11.2 - cudnn >= 8.2 +It is recommended to install the OpenCV library manually and define `-DOPENCV_DIRECTORY` to set the path of the OpenCV library. (If the flag is not defined, a prebuilt OpenCV library will be downloaded automatically while building FastDeploy, but the prebuilt OpenCV does not support reading video files or other functions such as `imshow`.) +``` +sudo apt-get install libopencv-dev +``` + ``` git clone https://github.com/PaddlePaddle/FastDeploy.git cd
FastDeploy @@ -46,7 +51,8 @@ cmake .. -DENABLE_ORT_BACKEND=ON \ -DTRT_DIRECTORY=/Paddle/TensorRT-8.4.1.5 \ -DCUDA_DIRECTORY=/usr/local/cuda \ -DCMAKE_INSTALL_PREFIX=${PWD}/compiled_fastdeploy_sdk \ - -DENABLE_VISION=ON + -DENABLE_VISION=ON \ + -DOPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4 make -j12 make install ``` @@ -106,6 +112,11 @@ Prerequisite for Compiling on Linux: All compilation options are imported via environment variables +It is recommended to install the OpenCV library manually and set the environment variable `OPENCV_DIRECTORY` to the path of the OpenCV library. (If it is not set, a prebuilt OpenCV library will be downloaded automatically while building FastDeploy, but the prebuilt OpenCV does not support reading video files or other functions such as `imshow`.) +``` +sudo apt-get install libopencv-dev +``` + ``` git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy/python export ENABLE_ORT_BACKEND=ON export ENABLE_PADDLE_BACKEND=ON export ENABLE_OPENVINO_BACKEND=ON export ENABLE_VISION=ON export ENABLE_TRT_BACKEND=ON export WITH_GPU=ON export TRT_DIRECTORY=/Paddle/TensorRT-8.4.1.5 export CUDA_DIRECTORY=/usr/local/cuda +# OPENCV_DIRECTORY is optional; if not exported, a prebuilt OpenCV library will be downloaded +export OPENCV_DIRECTORY=/usr/lib/x86_64-linux-gnu/cmake/opencv4 python setup.py build python setup.py bdist_wheel From 24327044e99ee9e6d3062ce49994124df4b8b8a3 Mon Sep 17 00:00:00 2001 From: DefTruth <31974251+DefTruth@users.noreply.github.com> Date: Fri, 9 Dec 2022 17:40:57 +0800 Subject: [PATCH 12/77] [cmake] Update paddlelite.cmake (#845) Update paddlelite.cmake --- cmake/paddlelite.cmake | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cmake/paddlelite.cmake b/cmake/paddlelite.cmake index 299843a6d..bcc0eb470 100755 --- a/cmake/paddlelite.cmake +++ b/cmake/paddlelite.cmake @@ -58,7 +58,7 @@ elseif(ANDROID) endif() else() # Linux if(CMAKE_HOST_SYSTEM_PROCESSOR MATCHES "aarch64") - set(PADDLELITE_URL "${PADDLELITE_URL_PREFIX}/lite-linux-arm64-20220920.tgz") + set(PADDLELITE_URL "${PADDLELITE_URL_PREFIX}/lite-linux-arm64-20221209.tgz") else() if(ENABLE_TIMVX) set(PADDLELITE_URL "https://bj.bcebos.com/fastdeploy/test/lite-linux_armhf_1130.tgz") From 035e51e6a4865ef615fba0f26651310bc7ee93aa Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 17:48:28 +0800 Subject: [PATCH 13/77] Update jetson.md --- docs/cn/build_and_install/jetson.md | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/docs/cn/build_and_install/jetson.md b/docs/cn/build_and_install/jetson.md index f60aa280c..43a3bb51e 100644 --- a/docs/cn/build_and_install/jetson.md +++ b/docs/cn/build_and_install/jetson.md @@ -10,12 +10,17 @@ FastDeploy currently supports only the ONNX Runtime (CPU) and TensorRT (GPU) inference backends on Jetson - cmake >= 3.10.0 - jetpack >= 4.6.1 + +If you need to integrate the Paddle Inference backend, download the matching Jetpack C++ package from the [Paddle Inference prebuilt libraries](https://www.paddlepaddle.org.cn/inference/v2.4/guides/install/download_lib.html#c) page according to your development environment, and extract it. + ```bash git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy mkdir build && cd build cmake ..
-DBUILD_ON_JETSON=ON \ -DENABLE_VISION=ON \ + -DENABLE_PADDLE_BACKEND=ON \ + -DPADDLEINFERENCE_DIRECTORY=/Download/paddle_inference_jetson \ -DCMAKE_INSTALL_PREFIX=${PWD}/installed_fastdeploy make -j8 make install @@ -34,6 +39,8 @@ make install Building the Python wheel depends on `wheel`; run `pip install wheel` before compiling +If you need to integrate the Paddle Inference backend, download the matching Jetpack C++ package from the [Paddle Inference prebuilt libraries](https://www.paddlepaddle.org.cn/inference/v2.4/guides/install/download_lib.html#c) page according to your development environment, and extract it. + All build options are imported via environment variables ```bash git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy/python export BUILD_ON_JETSON=ON export ENABLE_VISION=ON +export ENABLE_PADDLE_BACKEND=ON +export PADDLEINFERENCE_DIRECTORY=/Download/paddle_inference_jetson python setup.py build python setup.py bdist_wheel From 924d0e0e7b7077f5d2b3f24a07d1e5da39258817 Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 17:52:08 +0800 Subject: [PATCH 14/77] Update jetson.md --- docs/en/build_and_install/jetson.md | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/docs/en/build_and_install/jetson.md b/docs/en/build_and_install/jetson.md index e606b6d29..8d16f3149 100644 --- a/docs/en/build_and_install/jetson.md +++ b/docs/en/build_and_install/jetson.md @@ -1,7 +1,7 @@ # How to Build FastDeploy Library on Nvidia Jetson Platform -FastDeploy supports CPU inference with ONNX Runtime and GPU inference with Nvidia TensorRT on Nvidia Jetson platform +FastDeploy supports CPU inference with ONNX Runtime and GPU inference with Nvidia TensorRT/Paddle Inference on the Nvidia Jetson platform ## How to Build and Install FastDeploy C++ Library Prerequisite for Compiling on NVIDIA Jetson: - cmake >= 3.10.0 - jetpack >= 4.6.1 +If you need to integrate the Paddle Inference backend (supporting CPU/GPU), please download and decompress the prebuilt library from the [Paddle Inference prebuilt libraries](https://www.paddlepaddle.org.cn/inference/v2.4/guides/install/download_lib.html#c) page according to your development environment. ``` git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy mkdir build && cd build cmake .. -DBUILD_ON_JETSON=ON \ -DENABLE_VISION=ON \ + -DENABLE_PADDLE_BACKEND=ON \ # This is optional, can be OFF if you don't need it + -DPADDLEINFERENCE_DIRECTORY=/Download/paddle_inference_jetson \ -DCMAKE_INSTALL_PREFIX=${PWD}/installed_fastdeploy make -j8 make install @@ -35,6 +39,8 @@ Prerequisite for Compiling on NVIDIA Jetson: Note that `wheel` is required if you need to pack a wheel; execute `pip install wheel` first. +If you need to integrate the Paddle Inference backend (supporting CPU/GPU), please download and decompress the prebuilt library from the [Paddle Inference prebuilt libraries](https://www.paddlepaddle.org.cn/inference/v2.4/guides/install/download_lib.html#c) page according to your development environment.
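[Editor's note] Once FastDeploy has been built on Jetson with `ENABLE_PADDLE_BACKEND=ON` as described above, the backend can be requested per model at runtime. A hedged Python sketch, assuming the usual `RuntimeOption` helpers; model paths are hypothetical:

```python
import fastdeploy as fd

option = fd.RuntimeOption()
option.use_gpu()              # run on the Jetson GPU
option.use_paddle_backend()   # prefer the newly enabled Paddle Inference backend

# Any Paddle-format detection model works here; PP-YOLOE is just an example.
model = fd.vision.detection.PPYOLOE(
    "model.pdmodel", "model.pdiparams", "infer_cfg.yml",
    runtime_option=option)
```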
+ All compilation options are imported via environment variables ``` git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy/python export BUILD_ON_JETSON=ON export ENABLE_VISION=ON +# ENABLE_PADDLE_BACKEND & PADDLEINFERENCE_DIRECTORY are optional +export ENABLE_PADDLE_BACKEND=ON +export PADDLEINFERENCE_DIRECTORY=/Download/paddle_inference_jetson + python setup.py build python setup.py bdist_wheel ``` From 6f5521e63e1bc59999dba47797bc0238016f5ae5 Mon Sep 17 00:00:00 2001 From: Jason Date: Fri, 9 Dec 2022 17:53:04 +0800 Subject: [PATCH 15/77] Update jetson.md --- docs/cn/build_and_install/jetson.md | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/docs/cn/build_and_install/jetson.md b/docs/cn/build_and_install/jetson.md index 43a3bb51e..97ab59083 100644 --- a/docs/cn/build_and_install/jetson.md +++ b/docs/cn/build_and_install/jetson.md @@ -1,7 +1,7 @@ # Building the Deployment Library on Jetson -FastDeploy currently supports only the ONNX Runtime (CPU) and TensorRT (GPU) inference backends on Jetson +FastDeploy currently supports only the ONNX Runtime (CPU) and TensorRT/Paddle Inference (GPU) inference backends on Jetson ## Build and Install the C++ SDK @@ -19,7 +19,7 @@ cd FastDeploy mkdir build && cd build cmake .. -DBUILD_ON_JETSON=ON \ -DENABLE_VISION=ON \ - -DENABLE_PADDLE_BACKEND=ON \ + -DENABLE_PADDLE_BACKEND=ON \ # Optional; turn it OFF if the Paddle Inference backend is not needed -DPADDLEINFERENCE_DIRECTORY=/Download/paddle_inference_jetson \ -DCMAKE_INSTALL_PREFIX=${PWD}/installed_fastdeploy make -j8 @@ -48,6 +48,8 @@ git clone https://github.com/PaddlePaddle/FastDeploy.git cd FastDeploy/python export BUILD_ON_JETSON=ON export ENABLE_VISION=ON + +# ENABLE_PADDLE_BACKEND & PADDLEINFERENCE_DIRECTORY are optional export ENABLE_PADDLE_BACKEND=ON export PADDLEINFERENCE_DIRECTORY=/Download/paddle_inference_jetson From c7dc7d5eeea2ecc461d7015284a256b61b6f87ce Mon Sep 17 00:00:00 2001 From: Zheng_Bicheng <58363586+Zheng-Bicheng@users.noreply.github.com> Date: Sat, 10 Dec 2022 15:44:00 +0800 Subject: [PATCH 16/77] Add RKYOLOv5 RKYOLOX RKYOLOV7 (#709) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * Fix code format * Fix code format * Fix syntax errors * fix rk error * update * update * update * update * update * update * update Co-authored-by: Jason --- .../paddledetection/rknpu2/README.md | 2 + examples/vision/detection/rkyolo/README.md | 18 ++ .../detection/rkyolo/cpp/CMakeLists.txt | 37 +++ .../vision/detection/rkyolo/cpp/README.md | 69 +++++ .../detection/rkyolo/cpp/infer_rkyolo.cc | 53 ++++ .../vision/detection/rkyolo/python/README.md | 34 +++ .../vision/detection/rkyolo/python/infer.py | 53 ++++ .../backends/rknpu/rknpu2/rknpu2_backend.cc | 7 +- fastdeploy/core/fd_tensor.cc | 10 + fastdeploy/core/fd_tensor.h | 5 + fastdeploy/vision.h | 1 + .../vision/detection/contrib/rknpu2/model.h | 92 +++++++ .../detection/contrib/rknpu2/postprocessor.cc | 239 ++++++++++++++++++ .../detection/contrib/rknpu2/postprocessor.h | 105 ++++++++ .../detection/contrib/rknpu2/preprocessor.cc | 127 ++++++++++ .../detection/contrib/rknpu2/preprocessor.h | 100 ++++++++ .../vision/detection/contrib/rknpu2/rkyolo.cc | 73 ++++++ .../vision/detection/contrib/rknpu2/rkyolo.h | 64 +++++ .../detection/contrib/rknpu2/rkyolo_pybind.cc | 95 +++++++ .../vision/detection/contrib/rknpu2/utils.cc | 93 +++++++ .../vision/detection/contrib/rknpu2/utils.h | 26 ++ .../vision/detection/detection_pybind.cc | 2 + .../fastdeploy/vision/detection/__init__.py | 1 + .../detection/contrib/rkyolo/__init__.py | 16 ++ .../detection/contrib/rkyolo/rkyolov5.py | 195 ++++++++++++++ 25 files changed, 1516 insertions(+), 1 deletion(-) create mode 100644 examples/vision/detection/rkyolo/README.md create mode 100644
examples/vision/detection/rkyolo/cpp/CMakeLists.txt create mode 100644 examples/vision/detection/rkyolo/cpp/README.md create mode 100644 examples/vision/detection/rkyolo/cpp/infer_rkyolo.cc create mode 100644 examples/vision/detection/rkyolo/python/README.md create mode 100644 examples/vision/detection/rkyolo/python/infer.py create mode 100644 fastdeploy/vision/detection/contrib/rknpu2/model.h create mode 100755 fastdeploy/vision/detection/contrib/rknpu2/postprocessor.cc create mode 100755 fastdeploy/vision/detection/contrib/rknpu2/postprocessor.h create mode 100755 fastdeploy/vision/detection/contrib/rknpu2/preprocessor.cc create mode 100755 fastdeploy/vision/detection/contrib/rknpu2/preprocessor.h create mode 100644 fastdeploy/vision/detection/contrib/rknpu2/rkyolo.cc create mode 100644 fastdeploy/vision/detection/contrib/rknpu2/rkyolo.h create mode 100755 fastdeploy/vision/detection/contrib/rknpu2/rkyolo_pybind.cc create mode 100644 fastdeploy/vision/detection/contrib/rknpu2/utils.cc create mode 100644 fastdeploy/vision/detection/contrib/rknpu2/utils.h create mode 100644 python/fastdeploy/vision/detection/contrib/rkyolo/__init__.py create mode 100644 python/fastdeploy/vision/detection/contrib/rkyolo/rkyolov5.py diff --git a/examples/vision/detection/paddledetection/rknpu2/README.md b/examples/vision/detection/paddledetection/rknpu2/README.md index d5f339db5..98f1ada10 100644 --- a/examples/vision/detection/paddledetection/rknpu2/README.md +++ b/examples/vision/detection/paddledetection/rknpu2/README.md @@ -113,5 +113,7 @@ Preprocess: type: Resize ``` +## Other Links +- [C++ Deployment](./cpp) - [Python Deployment](./python) - [Vision Model Prediction Results](../../../../../docs/api/vision_results/) diff --git a/examples/vision/detection/rkyolo/README.md b/examples/vision/detection/rkyolo/README.md new file mode 100644 index 000000000..015e22506 --- /dev/null +++ b/examples/vision/detection/rkyolo/README.md @@ -0,0 +1,18 @@ +# Prepare RKYOLO Models for Deployment + +RKYOLO wraps the RKYOLO-series models based on the code of [rknn_model_zoo](https://github.com/airockchip/rknn_model_zoo/tree/main/models/CV/object_detection/yolo); currently the deployment of RKYOLOV5-series models is supported. + +## List of Supported Models + +* RKYOLOV5 + +## Model Conversion Example + +Please refer to [RKNN_model_convert](https://github.com/airockchip/rknn_model_zoo/tree/main/models/CV/object_detection/yolo/RKNN_model_convert) + + +## Other Links +- [C++ Deployment](./cpp) +- [Python Deployment](./python) +- [Vision Model Prediction Results](../../../../docs/api/vision_results/) diff --git a/examples/vision/detection/rkyolo/cpp/CMakeLists.txt b/examples/vision/detection/rkyolo/cpp/CMakeLists.txt new file mode 100644 index 000000000..524b94fea --- /dev/null +++ b/examples/vision/detection/rkyolo/cpp/CMakeLists.txt @@ -0,0 +1,37 @@ +CMAKE_MINIMUM_REQUIRED(VERSION 3.10) +project(rknpu2_test) + +set(CMAKE_CXX_STANDARD 14) + +# Path of the downloaded and extracted FastDeploy library +set(FASTDEPLOY_INSTALL_DIR "thirdpartys/fastdeploy-0.0.3") + +include(${FASTDEPLOY_INSTALL_DIR}/FastDeployConfig.cmake) +include_directories(${FastDeploy_INCLUDE_DIRS}) + +add_executable(infer_rkyolo infer_rkyolo.cc) +target_link_libraries(infer_rkyolo ${FastDeploy_LIBS}) + + + +set(CMAKE_INSTALL_PREFIX ${CMAKE_SOURCE_DIR}/build/install) + +install(TARGETS infer_rkyolo DESTINATION ./) + +install(DIRECTORY model DESTINATION ./) +install(DIRECTORY images DESTINATION ./) + +file(GLOB FASTDEPLOY_LIBS ${FASTDEPLOY_INSTALL_DIR}/lib/*) +message("${FASTDEPLOY_LIBS}") +install(PROGRAMS ${FASTDEPLOY_LIBS} DESTINATION lib) + +file(GLOB ONNXRUNTIME_LIBS ${FASTDEPLOY_INSTALL_DIR}/third_libs/install/onnxruntime/lib/*) +install(PROGRAMS ${ONNXRUNTIME_LIBS} DESTINATION lib) + +install(DIRECTORY
${FASTDEPLOY_INSTALL_DIR}/third_libs/install/opencv/lib DESTINATION ./) + +file(GLOB PADDLETOONNX_LIBS ${FASTDEPLOY_INSTALL_DIR}/third_libs/install/paddle2onnx/lib/*) +install(PROGRAMS ${PADDLETOONNX_LIBS} DESTINATION lib) + +file(GLOB RKNPU2_LIBS ${FASTDEPLOY_INSTALL_DIR}/third_libs/install/rknpu2_runtime/${RKNN2_TARGET_SOC}/lib/*) +install(PROGRAMS ${RKNPU2_LIBS} DESTINATION lib) diff --git a/examples/vision/detection/rkyolo/cpp/README.md b/examples/vision/detection/rkyolo/cpp/README.md new file mode 100644 index 000000000..16f8df72d --- /dev/null +++ b/examples/vision/detection/rkyolo/cpp/README.md @@ -0,0 +1,69 @@ +# RKYOLO C++ Deployment Example + +This directory provides `infer_xxxxx.cc` to quickly finish deploying RKYOLO models on Rockchip boards, accelerated by the 2nd-generation NPU. + +Before deployment, confirm the following two steps: + +1. The software and hardware environment meets the requirements +2. Download the prebuilt deployment library or build the FastDeploy repository from scratch according to your development environment + +Please refer to [How to Build the RKNPU2 Deployment Library](../../../../../docs/cn/build_and_install/rknpu2.md) for the steps above + +## Generate the Basic Directory Layout + +This example consists of the following parts +```text +. +├── CMakeLists.txt +├── build # build folder +├── images # folder for images +├── infer_rkyolo.cc +├── model # folder for model files +└── thirdpartys # folder for the SDK +``` + +First, generate the directory structure +```bash +mkdir build +mkdir images +mkdir model +mkdir thirdpartys +``` + +## Build + +### Build the SDK and copy it to the thirdpartys folder + +Please refer to [How to Build the RKNPU2 Deployment Library](../../../../../../docs/cn/build_and_install/rknpu2.md) to build the SDK. After the build finishes, a fastdeploy-0.0.3 directory is generated under the build directory; move it into the thirdpartys directory. + +### Copy the model files and the configuration file to the model folder +During the Paddle dynamic-graph model -> Paddle static-graph model -> ONNX model conversion, the ONNX file and the corresponding yaml configuration file are generated; put the configuration file into the model folder. The model file converted to RKNN also needs to be copied to model. + +### Prepare test images in the images folder +```bash +wget https://gitee.com/paddlepaddle/PaddleDetection/raw/release/2.4/demo/000000014439.jpg +cp 000000014439.jpg ./images +``` + +### Build the example + +```bash +cd build +cmake .. +make -j8 +make install +``` + +## Run the Example + +```bash +cd ./build/install +./infer_rkyolo model/ images/000000014439.jpg +``` + + +- [Model Introduction](../../) +- [Python Deployment](../python) +- [Vision Model Prediction Results](../../../../../../docs/api/vision_results/) diff --git a/examples/vision/detection/rkyolo/cpp/infer_rkyolo.cc b/examples/vision/detection/rkyolo/cpp/infer_rkyolo.cc new file mode 100644 index 000000000..c7c1be43b --- /dev/null +++ b/examples/vision/detection/rkyolo/cpp/infer_rkyolo.cc @@ -0,0 +1,53 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. +#include "fastdeploy/vision.h" + +void RKNPU2Infer(const std::string& model_file, const std::string& image_file) { + struct timeval start_time, stop_time; + + auto option = fastdeploy::RuntimeOption(); + option.UseRKNPU2(); + + auto format = fastdeploy::ModelFormat::RKNN; + + auto model = fastdeploy::vision::detection::RKYOLOV5( + model_file, option, format); + + auto im = cv::imread(image_file); + + fastdeploy::vision::DetectionResult res; + if (!model.Predict(im, &res)) { + std::cerr << "Failed to predict."
<< std::endl; + return; + } + std::cout << res.Str() << std::endl; + auto vis_im = fastdeploy::vision::VisDetection(im, res, 0.5); + cv::imwrite("vis_result.jpg", vis_im); + std::cout << "Visualized result saved in ./vis_result.jpg" << std::endl; +} + +int main(int argc, char* argv[]) { + if (argc < 3) { + std::cout + << "Usage: infer_rkyolo path/to/model path/to/image, " + "e.g. ./infer_rkyolo ./model ./test.jpeg" + << std::endl; + return -1; + } + + RKNPU2Infer(argv[1], argv[2]); + + return 0; +} + diff --git a/examples/vision/detection/rkyolo/python/README.md b/examples/vision/detection/rkyolo/python/README.md new file mode 100644 index 000000000..4549ec0f9 --- /dev/null +++ b/examples/vision/detection/rkyolo/python/README.md @@ -0,0 +1,34 @@ +# RKYOLO Python Deployment Example + +Before deployment, confirm the following step + +- 1. The software and hardware environment meets the requirements; refer to [FastDeploy Environment Requirements](../../../../../../docs/cn/build_and_install/rknpu2.md) + +This directory provides `infer.py` to quickly finish deploying RKYOLO on RKNPU. Run the following script to finish the deployment + +```bash +# Download the deployment example code +git clone https://github.com/PaddlePaddle/FastDeploy.git +cd FastDeploy/examples/vision/detection/rkyolo/python + +# Download the image +wget https://gitee.com/paddlepaddle/PaddleDetection/raw/release/2.4/demo/000000014439.jpg + +# copy model +cp -r ./model /path/to/FastDeploy/examples/vision/detection/rkyolo/python + +# Inference +python3 infer.py --model_file ./model/ \ + --image 000000014439.jpg +``` + + +## Notes +RKNPU requires the model input to be in NHWC format, and the image normalization step is embedded into the model when it is converted to RKNN; therefore, when deploying with FastDeploy, the image does not need to be normalized again in the preprocessing stage. + +## Other Documents + +- [RKYOLO Model Introduction](..) +- [RKYOLO C++ Deployment](../cpp) +- [Vision Model Prediction Results](../../../../../../docs/api/vision_results/) +- [RKNN Model Conversion Document](../README.md) diff --git a/examples/vision/detection/rkyolo/python/infer.py b/examples/vision/detection/rkyolo/python/infer.py new file mode 100644 index 000000000..38eea0e8c --- /dev/null +++ b/examples/vision/detection/rkyolo/python/infer.py @@ -0,0 +1,53 @@ +# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License.
+import fastdeploy as fd +import cv2 +import os + + +def parse_arguments(): + import argparse + import ast + parser = argparse.ArgumentParser() + parser.add_argument( + "--model_file", required=True, help="Path of rknn model.") + parser.add_argument( + "--image", type=str, required=True, help="Path of test image file.") + return parser.parse_args() + + +if __name__ == "__main__": + args = parse_arguments() + + model_file = args.model_file + params_file = "" + + # Configure runtime and load the model + runtime_option = fd.RuntimeOption() + runtime_option.use_rknpu2() + + model = fd.vision.detection.RKYOLOV5( + model_file, + runtime_option=runtime_option, + model_format=fd.ModelFormat.RKNN) + + # Predict the detection result of the image + im = cv2.imread(args.image) + result = model.predict(im) + print(result) + + # Visualize the result + vis_im = fd.vision.vis_detection(im, result, score_threshold=0.5) + cv2.imwrite("visualized_result.jpg", vis_im) + print("Visualized result saved in ./visualized_result.jpg") diff --git a/fastdeploy/backends/rknpu/rknpu2/rknpu2_backend.cc b/fastdeploy/backends/rknpu/rknpu2/rknpu2_backend.cc index 16edf7561..b577c2791 100644 --- a/fastdeploy/backends/rknpu/rknpu2/rknpu2_backend.cc +++ b/fastdeploy/backends/rknpu/rknpu2/rknpu2_backend.cc @@ -190,6 +190,8 @@ bool RKNPU2Backend::GetModelInputOutputInfos() { FDERROR << "rknpu2_backend only support input format is NHWC or UNDEFINED" << std::endl; } + DumpTensorAttr(input_attrs_[i]); + // copy input_attrs_ to input tensor info std::string temp_name = input_attrs_[i].name; std::vector<int> temp_shape{}; @@ -234,6 +236,8 @@ bool RKNPU2Backend::GetModelInputOutputInfos() { << std::endl; } + DumpTensorAttr(output_attrs_[i]); + // copy output_attrs_ to output tensor std::string temp_name = output_attrs_[i].name; std::vector<int> temp_shape{}; @@ -342,7 +346,6 @@ bool RKNPU2Backend::Infer(std::vector<FDTensor>& inputs, return false; } // default output type is depend on model, this requires float32 to compute top5 - output_attrs_[i].type = RKNN_TENSOR_FLOAT32; ret = rknn_set_io_mem(ctx, output_mems_[i], &output_attrs_[i]); // set output memory and attribute if (ret != RKNN_SUCC) { @@ -389,6 +392,8 @@ bool RKNPU2Backend::Infer(std::vector<FDTensor>& inputs, } (*outputs)[i].Resize(temp_shape, outputs_desc_[i].dtype, outputs_desc_[i].name); + std::vector<float> output_scale = {output_attrs_[i].scale}; + (*outputs)[i].SetQuantizationInfo(output_attrs_[i].zp, output_scale); memcpy((*outputs)[i].MutableData(), (float*)output_mems_[i]->virt_addr, (*outputs)[i].Nbytes()); } diff --git a/fastdeploy/core/fd_tensor.cc b/fastdeploy/core/fd_tensor.cc index e84535ac9..484e03913 100644 --- a/fastdeploy/core/fd_tensor.cc +++ b/fastdeploy/core/fd_tensor.cc @@ -138,6 +138,11 @@ void FDTensor::Resize(const std::vector<int64_t>& new_shape) { external_data_ptr = nullptr; } +void FDTensor::SetQuantizationInfo(int32_t zero_point, std::vector<float>& scale) { + quantized_parameter_.first = zero_point; + quantized_parameter_.second = scale; +} + void FDTensor::Resize(const std::vector<int64_t>& new_shape, const FDDataType& data_type, const std::string& tensor_name, @@ -450,4 +455,9 @@ FDTensor& FDTensor::operator=(FDTensor&& other) { return *this; } +const std::pair<int32_t, std::vector<float>> +FDTensor::GetQuantizationInfo() const { + return quantized_parameter_; +} + } // namespace fastdeploy diff --git a/fastdeploy/core/fd_tensor.h b/fastdeploy/core/fd_tensor.h index 3c79b0c88..e3e373c43 100644 --- a/fastdeploy/core/fd_tensor.h +++ b/fastdeploy/core/fd_tensor.h @@ -25,6 +25,11 @@ namespace fastdeploy { struct FASTDEPLOY_DECL FDTensor { + // These two parameters are general parameters of quantized
models. + std::pair<int32_t, std::vector<float>> quantized_parameter_ = {0, {0}}; + void SetQuantizationInfo(int32_t zero_point, std::vector<float>& scale); + const std::pair<int32_t, std::vector<float>> GetQuantizationInfo() const; + // std::vector data; void* buffer_ = nullptr; std::vector<int64_t> shape = {0}; diff --git a/fastdeploy/vision.h b/fastdeploy/vision.h index 9bea1550e..5ccaeb2dd 100644 --- a/fastdeploy/vision.h +++ b/fastdeploy/vision.h @@ -28,6 +28,7 @@ #include "fastdeploy/vision/detection/contrib/yolov7end2end_ort.h" #include "fastdeploy/vision/detection/contrib/yolov7end2end_trt.h" #include "fastdeploy/vision/detection/contrib/yolox.h" +#include "fastdeploy/vision/detection/contrib/rknpu2/model.h" #include "fastdeploy/vision/detection/ppdet/model.h" #include "fastdeploy/vision/facealign/contrib/face_landmark_1000.h" #include "fastdeploy/vision/facealign/contrib/pfld.h" diff --git a/fastdeploy/vision/detection/contrib/rknpu2/model.h b/fastdeploy/vision/detection/contrib/rknpu2/model.h new file mode 100644 index 000000000..9a0fd423d --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/model.h @@ -0,0 +1,92 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +#pragma once +#include "fastdeploy/vision/detection/contrib/rknpu2/rkyolo.h" +namespace fastdeploy { +namespace vision { +namespace detection { + +class FASTDEPLOY_DECL RKYOLOV5 : public RKYOLO { + public: + /** \brief Set path of model file and the configuration of runtime + * + * \param[in] model_file Path of model file, e.g ./yolov5.rknn + * \param[in] custom_option RuntimeOption for inference, the default will use the backend defined in `valid_rknpu_backends` + * \param[in] model_format Model format of the loaded model, default is RKNN format + */ + RKYOLOV5(const std::string& model_file, + const RuntimeOption& custom_option = RuntimeOption(), + const ModelFormat& model_format = ModelFormat::RKNN) + : RKYOLO(model_file, custom_option, model_format) { + valid_cpu_backends = {}; + valid_gpu_backends = {}; + valid_rknpu_backends = {Backend::RKNPU2}; + GetPostprocessor().SetModelType(ModelType::RKYOLOV5); + } + + virtual std::string ModelName() const { return "RKYOLOV5"; } +}; + +class FASTDEPLOY_DECL RKYOLOV7 : public RKYOLO { + public: + /** \brief Set path of model file and the configuration of runtime + * + * \param[in] model_file Path of model file, e.g ./yolov7.rknn + * \param[in] custom_option RuntimeOption for inference, the default will use the backend defined in `valid_rknpu_backends` + * \param[in] model_format Model format of the loaded model, default is RKNN format + */ + RKYOLOV7(const std::string& model_file, + const RuntimeOption& custom_option = RuntimeOption(), + const ModelFormat& model_format = ModelFormat::RKNN) + : RKYOLO(model_file, custom_option, model_format) { + valid_cpu_backends = {}; + valid_gpu_backends = {}; + valid_rknpu_backends = {Backend::RKNPU2}; + GetPostprocessor().SetModelType(ModelType::RKYOLOV7); + } + + virtual std::string ModelName() const { return "RKYOLOV7"; } +}; + +class FASTDEPLOY_DECL RKYOLOX : public RKYOLO { + public: + /** \brief Set path of model file and the configuration of runtime + * + * \param[in] model_file Path of model file, e.g ./yolox.rknn + * \param[in] custom_option RuntimeOption for inference, the default will use the backend defined in `valid_rknpu_backends` + * \param[in] model_format Model format of the loaded model, default is RKNN format + */ + RKYOLOX(const std::string& model_file, + const RuntimeOption& custom_option = RuntimeOption(), + const ModelFormat& model_format = ModelFormat::RKNN) + : RKYOLO(model_file, custom_option, model_format) { + valid_cpu_backends = {}; + valid_gpu_backends = {}; + valid_rknpu_backends = {Backend::RKNPU2}; + GetPostprocessor().SetModelType(ModelType::RKYOLOX); + } + + virtual std::string ModelName() const { return "RKYOLOX"; } +}; + +} // namespace detection +} // namespace vision +} // namespace fastdeploy diff --git a/fastdeploy/vision/detection/contrib/rknpu2/postprocessor.cc b/fastdeploy/vision/detection/contrib/rknpu2/postprocessor.cc new file mode 100755 index 000000000..bb46eff5c --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/postprocessor.cc @@ -0,0 +1,239 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License.
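[Editor's note] The postprocessor implemented next consumes the (zero_point, scale) pair that the backend now attaches to each INT8 output tensor via `SetQuantizationInfo`. The dequantization it performs is the usual affine mapping; a NumPy sketch of the same math (function name is illustrative, not part of the patch):

```python
import numpy as np

def dequantize(q: np.ndarray, zero_point: int, scale: float) -> np.ndarray:
    # float = (int8 - zero_point) * scale, mirroring DeqntAffineToF32 below
    return (q.astype(np.float32) - zero_point) * scale

q = np.array([-128, 0, 127], dtype=np.int8)
print(dequantize(q, zero_point=0, scale=0.0117))  # ~[-1.50, 0.00, 1.49]
```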
+ +#include "fastdeploy/vision/detection/contrib/rknpu2/postprocessor.h" +#include "fastdeploy/vision/utils/utils.h" + +namespace fastdeploy { +namespace vision { +namespace detection { + +RKYOLOPostprocessor::RKYOLOPostprocessor() {} + +void RKYOLOPostprocessor::SetModelType(ModelType model_type) { + model_type_ = model_type; + if (model_type == RKYOLOV5) { + anchors_ = {10, 13, 16, 30, 33, 23, 30, 61, 62, + 45, 59, 119, 116, 90, 156, 198, 373, 326}; + anchor_per_branch_ = 3; + } else if (model_type == RKYOLOX) { + anchors_ = {10, 13, 16, 30, 33, 23, 30, 61, 62, + 45, 59, 119, 116, 90, 156, 198, 373, 326}; + anchor_per_branch_ = 1; + } else if (model_type == RKYOLOV7) { + anchors_ = {12, 16, 19, 36, 40, 28, 36, 75, 76, + 55, 72, 146, 142, 110, 192, 243, 459, 401}; + anchor_per_branch_ = 3; + } else { + return; + } +} + +bool RKYOLOPostprocessor::Run(const std::vector& tensors, + std::vector* results) { + if (model_type_ == ModelType::UNKNOWN) { + FDERROR << "RKYOLO Only Support YOLOV5,YOLOV7,YOLOX" << std::endl; + return false; + } + + results->resize(tensors[0].shape[0]); + for (int num = 0; num < tensors[0].shape[0]; ++num) { + int validCount = 0; + std::vector filterBoxes; + std::vector boxesScore; + std::vector classId; + for (int i = 0; i < tensors.size(); i++) { + auto tensor_shape = tensors[i].shape; + auto skip_num = std::accumulate(tensor_shape.begin(), tensor_shape.end(), + 1, std::multiplies()); + int skip_address = num * skip_num; + int stride = strides_[i]; + int grid_h = height_ / stride; + int grid_w = width_ / stride; + int* anchor = &(anchors_.data()[i * 2 * anchor_per_branch_]); + if (tensors[i].dtype == FDDataType::INT8 || tensors[i].dtype == FDDataType::UINT8) { + auto quantization_info = tensors[i].GetQuantizationInfo(); + validCount = validCount + + ProcessInt8((int8_t*)tensors[i].Data() + skip_address, + anchor, grid_h, grid_w, stride, filterBoxes, + boxesScore, classId, conf_threshold_, + quantization_info.first, quantization_info.second[0]); + } else { + FDERROR << "RKYOLO Only Support INT8 Model" << std::endl; + } + } + + // no object detect + if (validCount <= 0) { + FDINFO << "The number of object detect is 0." 
<< std::endl; + return true; + } + + std::vector indexArray; + for (int i = 0; i < validCount; ++i) { + indexArray.push_back(i); + } + + QuickSortIndiceInverse(boxesScore, 0, validCount - 1, indexArray); + + if (model_type_ == RKYOLOV5 || model_type_ == RKYOLOV7) { + NMS(validCount, filterBoxes, classId, indexArray, nms_threshold_, false); + } else if (model_type_ == RKYOLOX) { + NMS(validCount, filterBoxes, classId, indexArray, nms_threshold_, true); + } + + int last_count = 0; + (*results)[num].Clear(); + (*results)[num].Reserve(validCount); + + /* box valid detect target */ + for (int i = 0; i < validCount; ++i) { + if (indexArray[i] == -1 || boxesScore[i] < conf_threshold_ || + last_count >= obj_num_bbox_max_size) { + continue; + } + int n = indexArray[i]; + float x1 = filterBoxes[n * 4 + 0]; + float y1 = filterBoxes[n * 4 + 1]; + float x2 = x1 + filterBoxes[n * 4 + 2]; + float y2 = y1 + filterBoxes[n * 4 + 3]; + int id = classId[n]; + (*results)[num].boxes.emplace_back(std::array{ + (float)((clamp(x1, 0, width_) - pad_hw_values_[num][1] / 2) / + scale_[num]), + (float)((clamp(y1, 0, height_) - pad_hw_values_[num][0] / 2) / + scale_[num]), + (float)((clamp(x2, 0, width_) - pad_hw_values_[num][1] / 2) / + scale_[num]), + (float)((clamp(y2, 0, height_) - pad_hw_values_[num][0] / 2) / + scale_[0])}); + (*results)[num].label_ids.push_back(id); + (*results)[num].scores.push_back(boxesScore[i]); + last_count++; + } + std::cout << "last_count" << last_count << std::endl; + } + return true; +} + +int RKYOLOPostprocessor::ProcessInt8(int8_t* input, int* anchor, int grid_h, + int grid_w, int stride, + std::vector& boxes, + std::vector& boxScores, + std::vector& classId, float threshold, + int32_t zp, float scale) { + int validCount = 0; + int grid_len = grid_h * grid_w; + float thres = threshold; + auto thres_i8 = QntF32ToAffine(thres, zp, scale); + for (int a = 0; a < anchor_per_branch_; a++) { + for (int i = 0; i < grid_h; i++) { + for (int j = 0; j < grid_w; j++) { + int8_t box_confidence = + input[(prob_box_size * a + 4) * grid_len + i * grid_w + j]; + if (box_confidence >= thres_i8) { + int offset = (prob_box_size * a) * grid_len + i * grid_w + j; + int8_t* in_ptr = input + offset; + + int8_t maxClassProbs = in_ptr[5 * grid_len]; + int maxClassId = 0; + for (int k = 1; k < obj_class_num; ++k) { + int8_t prob = in_ptr[(5 + k) * grid_len]; + if (prob > maxClassProbs) { + maxClassId = k; + maxClassProbs = prob; + } + } + + float box_conf_f32 = DeqntAffineToF32(box_confidence, zp, scale); + float class_prob_f32 = DeqntAffineToF32(maxClassProbs, zp, scale); + float limit_score = 0; + if (model_type_ == RKYOLOX) { + limit_score = box_conf_f32 * class_prob_f32; + } else { + limit_score = class_prob_f32; + } + //printf("limit score: %f\n", limit_score); + if (limit_score > conf_threshold_) { + float box_x, box_y, box_w, box_h; + if (model_type_ == RKYOLOX) { + box_x = DeqntAffineToF32(*in_ptr, zp, scale); + box_y = DeqntAffineToF32(in_ptr[grid_len], zp, scale); + box_w = DeqntAffineToF32(in_ptr[2 * grid_len], zp, scale); + box_h = DeqntAffineToF32(in_ptr[3 * grid_len], zp, scale); + box_w = exp(box_w) * stride; + box_h = exp(box_h) * stride; + } else { + box_x = DeqntAffineToF32(*in_ptr, zp, scale) * 2.0 - 0.5; + box_y = DeqntAffineToF32(in_ptr[grid_len], zp, scale) * 2.0 - 0.5; + box_w = DeqntAffineToF32(in_ptr[2 * grid_len], zp, scale) * 2.0; + box_h = DeqntAffineToF32(in_ptr[3 * grid_len], zp, scale) * 2.0; + box_w = box_w * box_w; + box_h = box_h * box_h; + } + box_x = (box_x + j) * 
(float)stride; + box_y = (box_y + i) * (float)stride; + box_w *= (float)anchor[a * 2]; + box_h *= (float)anchor[a * 2 + 1]; + box_x -= (box_w / 2.0); + box_y -= (box_h / 2.0); + + boxes.push_back(box_x); + boxes.push_back(box_y); + boxes.push_back(box_w); + boxes.push_back(box_h); + boxScores.push_back(box_conf_f32 * class_prob_f32); + classId.push_back(maxClassId); + validCount++; + } + } + } + } + } + return validCount; +} + +int RKYOLOPostprocessor::QuickSortIndiceInverse(std::vector& input, + int left, int right, + std::vector& indices) { + float key; + int key_index; + int low = left; + int high = right; + if (left < right) { + key_index = indices[left]; + key = input[left]; + while (low < high) { + while (low < high && input[high] <= key) { + high--; + } + input[low] = input[high]; + indices[low] = indices[high]; + while (low < high && input[low] >= key) { + low++; + } + input[high] = input[low]; + indices[high] = indices[low]; + } + input[low] = key; + indices[low] = key_index; + QuickSortIndiceInverse(input, left, low - 1, indices); + QuickSortIndiceInverse(input, low + 1, right, indices); + } + return low; +} + +} // namespace detection +} // namespace vision +} // namespace fastdeploy diff --git a/fastdeploy/vision/detection/contrib/rknpu2/postprocessor.h b/fastdeploy/vision/detection/contrib/rknpu2/postprocessor.h new file mode 100755 index 000000000..0332b2efd --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/postprocessor.h @@ -0,0 +1,105 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +#pragma once +#include "fastdeploy/vision/common/processors/transform.h" +#include "fastdeploy/vision/common/result.h" +#include "fastdeploy/vision/detection/contrib/rknpu2/utils.h" +#include +namespace fastdeploy { +namespace vision { +namespace detection { +/*! @brief Postprocessor object for YOLOv5 serials model. 
+ */ +class FASTDEPLOY_DECL RKYOLOPostprocessor { + public: + /** \brief Create a postprocessor instance for YOLOv5 series models + */ + RKYOLOPostprocessor(); + + /** \brief Process the result of runtime and fill it into DetectionResult structures + * + * \param[in] tensors The inference result from runtime + * \param[in] results The output detection result list + * \return true if the postprocessing succeeded, otherwise false + */ + bool Run(const std::vector<FDTensor>& tensors, + std::vector<DetectionResult>* results); + + /// Set nms_threshold, default 0.45 + void SetNMSThreshold(const float& nms_threshold) { + nms_threshold_ = nms_threshold; + } + + /// Set conf_threshold, default 0.25 + void SetConfThreshold(const float& conf_threshold) { + conf_threshold_ = conf_threshold; + } + + /// Get conf_threshold, default 0.25 + float GetConfThreshold() const { return conf_threshold_; } + + /// Get nms_threshold, default 0.45 + float GetNMSThreshold() const { return nms_threshold_; } + + // Set model_type + void SetModelType(ModelType model_type); + + // Set height and width + void SetHeightAndWeight(int& height, int& width) { + height_ = height; + width_ = width; + } + + // Set pad_hw_values + void SetPadHWValues(std::vector<std::vector<int>> pad_hw_values) { + pad_hw_values_ = pad_hw_values; + } + + // Set scale + void SetScale(std::vector<float> scale) { scale_ = scale; } + + private: + ModelType model_type_ = ModelType::UNKNOWN; + std::vector<int> anchors_ = {10, 13, 16, 30, 33, 23, 30, 61, 62, + 45, 59, 119, 116, 90, 156, 198, 373, 326}; + int strides_[3] = {8, 16, 32}; + int height_ = 0; + int width_ = 0; + int anchor_per_branch_ = 0; + + // Process Int8 Model + int ProcessInt8(int8_t* input, int* anchor, int grid_h, int grid_w, + int stride, std::vector<float>& boxes, + std::vector<float>& boxScores, std::vector<int>& classId, + float threshold, int32_t zp, float scale); + + // Sort scores in descending order and keep the index mapping + int QuickSortIndiceInverse(std::vector<float>& input, int left, int right, + std::vector<int>& indices); + + // post_process values + std::vector<std::vector<int>> pad_hw_values_; + std::vector<float> scale_; + float nms_threshold_ = 0.45; + float conf_threshold_ = 0.25; + int prob_box_size = 85; + int obj_class_num = 80; + int obj_num_bbox_max_size = 200; +}; + +} // namespace detection +} // namespace vision +} // namespace fastdeploy diff --git a/fastdeploy/vision/detection/contrib/rknpu2/preprocessor.cc b/fastdeploy/vision/detection/contrib/rknpu2/preprocessor.cc new file mode 100755 index 000000000..29480459b --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/preprocessor.cc @@ -0,0 +1,127 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License.
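[Editor's note] The preprocessor implemented next centers on a letterbox step: scale the image to fit the target size, then pad symmetrically with a constant value. A rough Python/OpenCV sketch of the same computation, assuming a BGR input and the patch's defaults (640x640 target, pad value 114); the helper name is illustrative:

```python
import cv2
import numpy as np

def letterbox(img: np.ndarray, size=(640, 640), pad_value=114):
    h, w = img.shape[:2]
    scale = min(size[1] / h, size[0] / w)            # fit without distortion
    resized = cv2.resize(img, (int(round(w * scale)), int(round(h * scale))))
    pad_w = size[0] - resized.shape[1]
    pad_h = size[1] - resized.shape[0]
    top, left = pad_h // 2, pad_w // 2
    out = cv2.copyMakeBorder(resized, top, pad_h - top, left, pad_w - left,
                             cv2.BORDER_CONSTANT, value=(pad_value,) * 3)
    # (pad_h, pad_w) and scale are what SetPadHWValues/SetScale later receive
    return out, scale, (pad_h, pad_w)
```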
+ +#include "fastdeploy/vision/detection/contrib/rknpu2/preprocessor.h" +#include "fastdeploy/function/concat.h" + +namespace fastdeploy { +namespace vision { +namespace detection { + +RKYOLOPreprocessor::RKYOLOPreprocessor() { + size_ = {640, 640}; + padding_value_ = {114.0, 114.0, 114.0}; + is_mini_pad_ = false; + is_no_pad_ = false; + is_scale_up_ = true; + stride_ = 32; + max_wh_ = 7680.0; +} + +void RKYOLOPreprocessor::LetterBox(FDMat* mat) { + std::cout << "mat->Height() = " << mat->Height() << std::endl; + std::cout << "mat->Width() = " << mat->Width() << std::endl; + + float scale = + std::min(size_[1] * 1.0 / mat->Height(), size_[0] * 1.0 / mat->Width()); + std::cout << "RKYOLOPreprocessor scale_ = " << scale << std::endl; + if (!is_scale_up_) { + scale = std::min(scale, 1.0f); + } + std::cout << "RKYOLOPreprocessor scale_ = " << scale << std::endl; + scale_.push_back(scale); + + int resize_h = int(round(mat->Height() * scale)); + int resize_w = int(round(mat->Width() * scale)); + + int pad_w = size_[0] - resize_w; + int pad_h = size_[1] - resize_h; + if (is_mini_pad_) { + pad_h = pad_h % stride_; + pad_w = pad_w % stride_; + } else if (is_no_pad_) { + pad_h = 0; + pad_w = 0; + resize_h = size_[1]; + resize_w = size_[0]; + } + + pad_hw_values_.push_back({pad_h,pad_w}); + + if (std::fabs(scale - 1.0f) > 1e-06) { + Resize::Run(mat, resize_w, resize_h); + } + if (pad_h > 0 || pad_w > 0) { + float half_h = pad_h * 1.0 / 2; + int top = int(round(half_h - 0.1)); + int bottom = int(round(half_h + 0.1)); + float half_w = pad_w * 1.0 / 2; + int left = int(round(half_w - 0.1)); + int right = int(round(half_w + 0.1)); + Pad::Run(mat, top, bottom, left, right, padding_value_); + } +} + +bool RKYOLOPreprocessor::Preprocess(FDMat* mat, FDTensor* output) { + // process after image load +// float ratio = std::min(size_[1] * 1.0f / static_cast(mat->Height()), +// size_[0] * 1.0f / static_cast(mat->Width())); +// if (std::fabs(ratio - 1.0f) > 1e-06) { +// int interp = cv::INTER_AREA; +// if (ratio > 1.0) { +// interp = cv::INTER_LINEAR; +// } +// int resize_h = int(mat->Height() * ratio); +// int resize_w = int(mat->Width() * ratio); +// Resize::Run(mat, resize_w, resize_h, -1, -1, interp); +// } + + // RKYOLO's preprocess steps + // 1. letterbox + // 2. convert_and_permute(swap_rb=true) + LetterBox(mat); + BGR2RGB::Run(mat); + mat->ShareWithTensor(output); + output->ExpandDim(0); // reshape to n, h, w, c + return true; +} + +bool RKYOLOPreprocessor::Run(std::vector* images, + std::vector* outputs) { + if (images->size() == 0) { + FDERROR << "The size of input images should be greater than 0." + << std::endl; + return false; + } + outputs->resize(1); + // Concat all the preprocessed data to a batch tensor + std::vector tensors(images->size()); + for (size_t i = 0; i < images->size(); ++i) { + if (!Preprocess(&(*images)[i], &tensors[i])) { + FDERROR << "Failed to preprocess input image." << std::endl; + return false; + } + } + + if (tensors.size() == 1) { + (*outputs)[0] = std::move(tensors[0]); + } else { + function::Concat(tensors, &((*outputs)[0]), 0); + } + return true; +} + +} // namespace detection +} // namespace vision +} // namespace fastdeploy diff --git a/fastdeploy/vision/detection/contrib/rknpu2/preprocessor.h b/fastdeploy/vision/detection/contrib/rknpu2/preprocessor.h new file mode 100755 index 000000000..e6ecfe452 --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/preprocessor.h @@ -0,0 +1,100 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. 
+// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +#pragma once +#include "fastdeploy/vision/common/processors/transform.h" +#include "fastdeploy/vision/common/result.h" + +namespace fastdeploy { +namespace vision { + +namespace detection { +/*! @brief Preprocessor object for YOLOv5 serials model. + */ +class FASTDEPLOY_DECL RKYOLOPreprocessor { + public: + /** \brief Create a preprocessor instance for YOLOv5 serials model + */ + RKYOLOPreprocessor(); + + /** \brief Process the input image and prepare input tensors for runtime + * + * \param[in] images The input image data list, all the elements are returned by cv::imread() + * \param[in] outputs The output tensors which will feed in runtime + * \param[in] ims_info The shape info list, record input_shape and output_shape + * \return true if the preprocess successed, otherwise false + */ + bool Run(std::vector* images, std::vector* outputs); + + /// Set target size, tuple of (width, height), default size = {640, 640} + void SetSize(const std::vector& size) { size_ = size; } + + /// Get target size, tuple of (width, height), default size = {640, 640} + std::vector GetSize() const { return size_; } + + /// Set padding value, size should be the same as channels + void SetPaddingValue(const std::vector& padding_value) { + padding_value_ = padding_value; + } + + /// Get padding value, size should be the same as channels + std::vector GetPaddingValue() const { return padding_value_; } + + /// Set is_scale_up, if is_scale_up is false, the input image only + /// can be zoom out, the maximum resize scale cannot exceed 1.0, default true + void SetScaleUp(bool is_scale_up) { is_scale_up_ = is_scale_up; } + + /// Get is_scale_up, default true + bool GetScaleUp() const { return is_scale_up_; } + + std::vector> GetPadHWValues() const { + return pad_hw_values_; + } + std::vector GetScale() const { return scale_; } + + protected: + bool Preprocess(FDMat* mat, FDTensor* output); + + void LetterBox(FDMat* mat); + + // target size, tuple of (width, height), default size = {640, 640} + std::vector size_; + + // padding value, size should be the same as channels + std::vector padding_value_; + + // only pad to the minimum rectange which height and width is times of stride + bool is_mini_pad_; + + // while is_mini_pad = false and is_no_pad = true, + // will resize the image to the set size + bool is_no_pad_; + + // if is_scale_up is false, the input image only can be zoom out, + // the maximum resize scale cannot exceed 1.0 + bool is_scale_up_; + + // padding stride, for is_mini_pad + int stride_; + + // for offseting the boxes by classes when using NMS + float max_wh_; + + std::vector> pad_hw_values_; + std::vector scale_; +}; + +} // namespace detection +} // namespace vision +} // namespace fastdeploy diff --git a/fastdeploy/vision/detection/contrib/rknpu2/rkyolo.cc b/fastdeploy/vision/detection/contrib/rknpu2/rkyolo.cc new file mode 100644 index 000000000..017cb1be3 --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/rkyolo.cc @@ -0,0 
+1,73 @@ +#include "fastdeploy/vision/detection/contrib/rknpu2/rkyolo.h" + +namespace fastdeploy { +namespace vision { +namespace detection { + +RKYOLO::RKYOLO(const std::string& model_file, + const fastdeploy::RuntimeOption& custom_option, + const fastdeploy::ModelFormat& model_format) { + if (model_format == ModelFormat::RKNN) { + valid_cpu_backends = {}; + valid_gpu_backends = {}; + valid_rknpu_backends = {Backend::RKNPU2}; + } else { + FDERROR << "RKYOLO only supports running on RKNPU2" << std::endl; + } + runtime_option = custom_option; + runtime_option.model_format = model_format; + runtime_option.model_file = model_file; + initialized = Initialize(); +} + +bool RKYOLO::Initialize() { + if (!InitRuntime()) { + FDERROR << "Failed to initialize fastdeploy backend." << std::endl; + return false; + } + auto size = GetPreprocessor().GetSize(); + GetPostprocessor().SetHeightAndWeight(size[0], size[1]); + return true; +} + +bool RKYOLO::Predict(const cv::Mat& im, + DetectionResult* result) { + std::vector<DetectionResult> results; + if (!BatchPredict({im}, &results)) { + return false; + } + *result = std::move(results[0]); + return true; +} + +bool RKYOLO::BatchPredict(const std::vector<cv::Mat>& images, + std::vector<DetectionResult>* results) { + std::vector<FDMat> fd_images = WrapMat(images); + + if (!preprocessor_.Run(&fd_images, &reused_input_tensors_)) { + FDERROR << "Failed to preprocess the input image." << std::endl; + return false; + } + auto pad_hw_values_ = preprocessor_.GetPadHWValues(); + postprocessor_.SetPadHWValues(preprocessor_.GetPadHWValues()); + std::cout << "preprocessor_ scale_ = " << preprocessor_.GetScale()[0] << std::endl; + postprocessor_.SetScale(preprocessor_.GetScale()); + + reused_input_tensors_[0].name = InputInfoOfRuntime(0).name; + if (!Infer(reused_input_tensors_, &reused_output_tensors_)) { + FDERROR << "Failed to inference by runtime." << std::endl; + return false; + } + + + if (!postprocessor_.Run(reused_output_tensors_, results)) { + FDERROR << "Failed to postprocess the inference results by runtime." << std::endl; + return false; + } + + return true; +} + +} // namespace detection +} // namespace vision +} // namespace fastdeploy \ No newline at end of file diff --git a/fastdeploy/vision/detection/contrib/rknpu2/rkyolo.h b/fastdeploy/vision/detection/contrib/rknpu2/rkyolo.h new file mode 100644 index 000000000..d7190eb73 --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/rkyolo.h @@ -0,0 +1,64 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. //NOLINT +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License.
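[Editor's note] `BatchPredict` above hands the letterbox padding and scale over to the postprocessor, which maps boxes from letterboxed coordinates back to the source image by subtracting half the padding and dividing by the scale. A small Python sketch of that inverse mapping (clamping to the input size, which the C++ code also does, is omitted here; the function name is illustrative):

```python
def unletterbox_box(box, pad_hw, scale):
    # box is (x1, y1, x2, y2) in letterboxed coordinates;
    # pad_hw is the (pad_h, pad_w) pair recorded during preprocessing.
    pad_h, pad_w = pad_hw
    x1, y1, x2, y2 = box
    return ((x1 - pad_w / 2) / scale, (y1 - pad_h / 2) / scale,
            (x2 - pad_w / 2) / scale, (y2 - pad_h / 2) / scale)

print(unletterbox_box((100, 120, 300, 360), pad_hw=(80, 0), scale=0.5))
```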
+ +#pragma once + +#include "fastdeploy/fastdeploy_model.h" +#include "fastdeploy/vision/detection/contrib/rknpu2/postprocessor.h" +#include "fastdeploy/vision/detection/contrib/rknpu2/preprocessor.h" + +namespace fastdeploy { +namespace vision { +namespace detection { + +class FASTDEPLOY_DECL RKYOLO : public FastDeployModel { + public: + RKYOLO(const std::string& model_file, + const RuntimeOption& custom_option = RuntimeOption(), + const ModelFormat& model_format = ModelFormat::RKNN); + + std::string ModelName() const { return "RKYOLO"; } + + /** \brief Predict the detection result for an input image + * + * \param[in] img The input image data, comes from cv::imread(), is a 3-D array with layout HWC, BGR format + * \param[in] result The output detection result will be written to this structure + * \return true if the prediction succeeded, otherwise false + */ + virtual bool Predict(const cv::Mat& img, DetectionResult* result); + + /** \brief Predict the detection results for a batch of input images + * + * \param[in] imgs The input image list, each element comes from cv::imread() + * \param[in] results The output detection result list + * \return true if the prediction succeeded, otherwise false + */ + virtual bool BatchPredict(const std::vector<cv::Mat>& imgs, + std::vector<DetectionResult>* results); + + /// Get preprocessor reference of RKYOLO + RKYOLOPreprocessor& GetPreprocessor() { return preprocessor_; } + + /// Get postprocessor reference of RKYOLO + RKYOLOPostprocessor& GetPostprocessor() { return postprocessor_; } + + protected: + bool Initialize(); + RKYOLOPreprocessor preprocessor_; + RKYOLOPostprocessor postprocessor_; +}; + +} // namespace detection +} // namespace vision +} // namespace fastdeploy diff --git a/fastdeploy/vision/detection/contrib/rknpu2/rkyolo_pybind.cc b/fastdeploy/vision/detection/contrib/rknpu2/rkyolo_pybind.cc new file mode 100755 index 000000000..716464458 --- /dev/null +++ b/fastdeploy/vision/detection/contrib/rknpu2/rkyolo_pybind.cc @@ -0,0 +1,95 @@ +// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License.
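[Editor's note] The bindings that follow expose the postprocessor thresholds as Python properties. A hedged usage sketch, assuming the Python-side wrapper forwards the underlying binding's `postprocessor` property (the model path is hypothetical):

```python
import fastdeploy as fd

opt = fd.RuntimeOption()
opt.use_rknpu2()
model = fd.vision.detection.RKYOLOV5(
    "yolov5-640.rknn", runtime_option=opt, model_format=fd.ModelFormat.RKNN)

# Tighten/loosen filtering without rebuilding the model
model.postprocessor.conf_threshold = 0.4   # default 0.25
model.postprocessor.nms_threshold = 0.5    # default 0.45
```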
+
+#include "fastdeploy/pybind/main.h"
+
+namespace fastdeploy {
+void BindRKYOLO(pybind11::module& m) {
+  pybind11::class_<vision::detection::RKYOLOPreprocessor>(
+      m, "RKYOLOPreprocessor")
+      .def(pybind11::init<>())
+      .def("run", [](vision::detection::RKYOLOPreprocessor& self,
+                     std::vector<pybind11::array>& im_list) {
+        std::vector<vision::FDMat> images;
+        for (size_t i = 0; i < im_list.size(); ++i) {
+          images.push_back(vision::WrapMat(PyArrayToCvMat(im_list[i])));
+        }
+        std::vector<FDTensor> outputs;
+        if (!self.Run(&images, &outputs)) {
+          throw std::runtime_error("Failed to preprocess the input data in RKYOLOPreprocessor.");
+        }
+        for (size_t i = 0; i < outputs.size(); ++i) {
+          outputs[i].StopSharing();
+        }
+        return outputs;
+      })
+      .def_property("size", &vision::detection::RKYOLOPreprocessor::GetSize,
+                    &vision::detection::RKYOLOPreprocessor::SetSize)
+      .def_property("padding_value", &vision::detection::RKYOLOPreprocessor::GetPaddingValue,
+                    &vision::detection::RKYOLOPreprocessor::SetPaddingValue)
+      .def_property("is_scale_up", &vision::detection::RKYOLOPreprocessor::GetScaleUp,
+                    &vision::detection::RKYOLOPreprocessor::SetScaleUp);
+
+  pybind11::class_<vision::detection::RKYOLOPostprocessor>(
+      m, "RKYOLOPostprocessor")
+      .def(pybind11::init<>())
+      .def("run", [](vision::detection::RKYOLOPostprocessor& self,
+                     std::vector<FDTensor>& inputs) {
+        std::vector<vision::DetectionResult> results;
+        if (!self.Run(inputs, &results)) {
+          throw std::runtime_error("Failed to postprocess the runtime result in RKYOLOPostprocessor.");
+        }
+        return results;
+      })
+      .def("run", [](vision::detection::RKYOLOPostprocessor& self,
+                     std::vector<pybind11::array>& input_array) {
+        std::vector<vision::DetectionResult> results;
+        std::vector<FDTensor> inputs;
+        PyArrayToTensorList(input_array, &inputs, /*share_buffer=*/true);
+        if (!self.Run(inputs, &results)) {
+          throw std::runtime_error("Failed to postprocess the runtime result in RKYOLOPostprocessor.");
+        }
+        return results;
+      })
+      .def_property("conf_threshold", &vision::detection::RKYOLOPostprocessor::GetConfThreshold,
+                    &vision::detection::RKYOLOPostprocessor::SetConfThreshold)
+      .def_property("nms_threshold", &vision::detection::RKYOLOPostprocessor::GetNMSThreshold,
+                    &vision::detection::RKYOLOPostprocessor::SetNMSThreshold);
+
+  pybind11::class_<vision::detection::RKYOLOV5, FastDeployModel>(m, "RKYOLOV5")
+      .def(pybind11::init<std::string, RuntimeOption, ModelFormat>())
+      .def("predict",
+           [](vision::detection::RKYOLOV5& self,
+              pybind11::array& data) {
+             auto mat = PyArrayToCvMat(data);
+             vision::DetectionResult res;
+             self.Predict(mat, &res);
+             return res;
+           })
+      .def("batch_predict", [](vision::detection::RKYOLOV5& self,
+                               std::vector<pybind11::array>& data) {
+        std::vector<cv::Mat> images;
+        for (size_t i = 0; i < data.size(); ++i) {
+          images.push_back(PyArrayToCvMat(data[i]));
+        }
+        std::vector<vision::DetectionResult> results;
+        self.BatchPredict(images, &results);
+        return results;
+      })
+      .def_property_readonly("preprocessor", &vision::detection::RKYOLOV5::GetPreprocessor)
+      .def_property_readonly("postprocessor", &vision::detection::RKYOLOV5::GetPostprocessor);
+}
+}  // namespace fastdeploy
diff --git a/fastdeploy/vision/detection/contrib/rknpu2/utils.cc b/fastdeploy/vision/detection/contrib/rknpu2/utils.cc
new file mode 100644
index 000000000..faac26983
--- /dev/null
+++ b/fastdeploy/vision/detection/contrib/rknpu2/utils.cc
@@ -0,0 +1,93 @@
+// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. //NOLINT
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+#include "fastdeploy/vision/detection/contrib/rknpu2/utils.h"
+float clamp(float val, int min, int max) {
+  return val > min ? (val < max ? val : max) : min;
+}
+
+float Sigmoid(float x) { return 1.0 / (1.0 + expf(-x)); }
+
+float UnSigmoid(float y) { return -1.0 * logf((1.0 / y) - 1.0); }
+
+int32_t __clip(float val, float min, float max) {
+  float f = val <= min ? min : (val >= max ? max : val);
+  return f;
+}
+
+int8_t QntF32ToAffine(float f32, int32_t zp, float scale) {
+  float dst_val = (f32 / scale) + zp;
+  int8_t res = (int8_t)__clip(dst_val, -128, 127);
+  return res;
+}
+
+float DeqntAffineToF32(int8_t qnt, int32_t zp, float scale) {
+  return ((float)qnt - (float)zp) * scale;
+}
+
+static float CalculateOverlap(float xmin0, float ymin0, float xmax0, float ymax0, float xmin1, float ymin1, float xmax1, float ymax1)
+{
+    float w = fmax(0.f, fmin(xmax0, xmax1) - fmax(xmin0, xmin1) + 1.0);
+    float h = fmax(0.f, fmin(ymax0, ymax1) - fmax(ymin0, ymin1) + 1.0);
+    float i = w * h;
+    float u = (xmax0 - xmin0 + 1.0) * (ymax0 - ymin0 + 1.0) + (xmax1 - xmin1 + 1.0) * (ymax1 - ymin1 + 1.0) - i;
+    return u <= 0.f ? 0.f : (i / u);
+}
+
+int NMS(int validCount,
+        std::vector<float> &outputLocations,
+        std::vector<int> &class_id,
+        std::vector<int> &order,
+        float threshold,
+        bool class_agnostic)
+{
+    // Greedy NMS; boxes are stored as [x, y, w, h], suppressed entries get order[j] = -1.
+    for (int i = 0; i < validCount; ++i)
+    {
+        if (order[i] == -1)
+        {
+            continue;
+        }
+        int n = order[i];
+        for (int j = i + 1; j < validCount; ++j)
+        {
+            int m = order[j];
+            if (m == -1)
+            {
+                continue;
+            }
+
+            if (!class_agnostic && class_id[n] != class_id[m]) {
+                continue;
+            }
+
+            float xmin0 = outputLocations[n * 4 + 0];
+            float ymin0 = outputLocations[n * 4 + 1];
+            float xmax0 = outputLocations[n * 4 + 0] + outputLocations[n * 4 + 2];
+            float ymax0 = outputLocations[n * 4 + 1] + outputLocations[n * 4 + 3];
+
+            float xmin1 = outputLocations[m * 4 + 0];
+            float ymin1 = outputLocations[m * 4 + 1];
+            float xmax1 = outputLocations[m * 4 + 0] + outputLocations[m * 4 + 2];
+            float ymax1 = outputLocations[m * 4 + 1] + outputLocations[m * 4 + 3];
+
+            float iou = CalculateOverlap(xmin0, ymin0, xmax0, ymax0, xmin1, ymin1, xmax1, ymax1);
+
+            if (iou > threshold)
+            {
+                order[j] = -1;
+            }
+        }
+    }
+    return 0;
+}
\ No newline at end of file
diff --git a/fastdeploy/vision/detection/contrib/rknpu2/utils.h b/fastdeploy/vision/detection/contrib/rknpu2/utils.h
new file mode 100644
index 000000000..4414cb8a5
--- /dev/null
+++ b/fastdeploy/vision/detection/contrib/rknpu2/utils.h
@@ -0,0 +1,26 @@
+// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. //NOLINT
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+#pragma once
+#include <cmath>
+#include <vector>
+typedef enum { RKYOLOX = 0, RKYOLOV5, RKYOLOV7, UNKNOWN } ModelType;
+float clamp(float val, int min, int max);
+float Sigmoid(float x);
+float UnSigmoid(float y);
+int32_t __clip(float val, float min, float max);
+int8_t QntF32ToAffine(float f32, int32_t zp, float scale);
+float DeqntAffineToF32(int8_t qnt, int32_t zp, float scale);
+int NMS(int validCount, std::vector<float>& outputLocations,
+        std::vector<int>& class_id, std::vector<int>& order, float threshold,
+        bool class_agnostic);
diff --git a/fastdeploy/vision/detection/detection_pybind.cc b/fastdeploy/vision/detection/detection_pybind.cc
index b3a7a6ad9..9d585e18c 100644
--- a/fastdeploy/vision/detection/detection_pybind.cc
+++ b/fastdeploy/vision/detection/detection_pybind.cc
@@ -27,6 +27,7 @@ void BindNanoDetPlus(pybind11::module& m);
 void BindPPDet(pybind11::module& m);
 void BindYOLOv7End2EndTRT(pybind11::module& m);
 void BindYOLOv7End2EndORT(pybind11::module& m);
+void BindRKYOLO(pybind11::module& m);
 
 void BindDetection(pybind11::module& m) {
   auto detection_module =
@@ -42,5 +43,6 @@ void BindDetection(pybind11::module& m) {
   BindNanoDetPlus(detection_module);
   BindYOLOv7End2EndTRT(detection_module);
   BindYOLOv7End2EndORT(detection_module);
+  BindRKYOLO(detection_module);
 }
 }  // namespace fastdeploy
diff --git a/python/fastdeploy/vision/detection/__init__.py b/python/fastdeploy/vision/detection/__init__.py
index b5f01f3a7..afd1cd8ce 100755
--- a/python/fastdeploy/vision/detection/__init__.py
+++ b/python/fastdeploy/vision/detection/__init__.py
@@ -24,3 +24,4 @@ from .contrib.yolov6 import YOLOv6
 from .contrib.yolov7end2end_trt import YOLOv7End2EndTRT
 from .contrib.yolov7end2end_ort import YOLOv7End2EndORT
 from .ppdet import *
+from .contrib.rkyolo import *
diff --git a/python/fastdeploy/vision/detection/contrib/rkyolo/__init__.py b/python/fastdeploy/vision/detection/contrib/rkyolo/__init__.py
new file mode 100644
index 000000000..ce89483ce
--- /dev/null
+++ b/python/fastdeploy/vision/detection/contrib/rkyolo/__init__.py
@@ -0,0 +1,16 @@
+# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import absolute_import
+from .rkyolov5 import *
diff --git a/python/fastdeploy/vision/detection/contrib/rkyolo/rkyolov5.py b/python/fastdeploy/vision/detection/contrib/rkyolo/rkyolov5.py
new file mode 100644
index 000000000..bfefb2127
--- /dev/null
+++ b/python/fastdeploy/vision/detection/contrib/rkyolo/rkyolov5.py
@@ -0,0 +1,195 @@
+# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import absolute_import
+import logging
+from ..... import FastDeployModel, ModelFormat
+from ..... import c_lib_wrap as C
+
+
+class RKYOLOPreprocessor:
+    def __init__(self):
+        """Create a preprocessor for RKYOLOV5
+        """
+        self._preprocessor = C.vision.detection.RKYOLOPreprocessor()
+
+    def run(self, input_ims):
+        """Preprocess input images for RKYOLOV5
+
+        :param: input_ims: (list of numpy.ndarray) The input images
+        :return: list of FDTensor
+        """
+        return self._preprocessor.run(input_ims)
+
+    @property
+    def size(self):
+        """
+        Argument for image preprocessing step, the preprocess image size, tuple of (width, height), default size = [640, 640]
+        """
+        return self._preprocessor.size
+
+    @property
+    def padding_value(self):
+        """
+        Padding value for preprocessing, default [114.0, 114.0, 114.0]
+        """
+        # padding value, size should be the same as channels
+        return self._preprocessor.padding_value
+
+    @property
+    def is_scale_up(self):
+        """
+        is_scale_up for preprocessing, the input image can only be zoomed out (the maximum resize scale cannot exceed 1.0), default True
+        """
+        return self._preprocessor.is_scale_up
+
+    @size.setter
+    def size(self, wh):
+        assert isinstance(wh, (list, tuple)), \
+            "The value to set `size` must be type of tuple or list."
+        assert len(wh) == 2, \
+            "The value to set `size` must contain 2 elements means [width, height], but now it contains {} elements.".format(
+                len(wh))
+        self._preprocessor.size = wh
+
+    @padding_value.setter
+    def padding_value(self, value):
+        assert isinstance(
+            value,
+            list), "The value to set `padding_value` must be type of list."
+        self._preprocessor.padding_value = value
+
+    @is_scale_up.setter
+    def is_scale_up(self, value):
+        assert isinstance(
+            value,
+            bool), "The value to set `is_scale_up` must be type of bool."
+        self._preprocessor.is_scale_up = value
+
+
+class RKYOLOPostprocessor:
+    def __init__(self):
+        """Create a postprocessor for RKYOLOV5
+        """
+        self._postprocessor = C.vision.detection.RKYOLOPostprocessor()
+
+    def run(self, runtime_results):
+        """Postprocess the runtime results for RKYOLOV5
+
+        :param: runtime_results: (list of FDTensor) The output FDTensor results from runtime
+        :return: list of DetectionResult (if the runtime_results were predicted from batched samples, the length of this list equals the batch size)
+        """
+        return self._postprocessor.run(runtime_results)
+
+    @property
+    def conf_threshold(self):
+        """
+        Confidence threshold for postprocessing, default is 0.25
+        """
+        return self._postprocessor.conf_threshold
+
+    @property
+    def nms_threshold(self):
+        """
+        NMS threshold for postprocessing, default is 0.5
+        """
+        return self._postprocessor.nms_threshold
+
+    @property
+    def multi_label(self):
+        """
+        multi_label for postprocessing, set True for evaluation, default is True
+        """
+        return self._postprocessor.multi_label
+
+    @conf_threshold.setter
+    def conf_threshold(self, conf_threshold):
+        assert isinstance(conf_threshold, float), \
+            "The value to set `conf_threshold` must be type of float."
+        self._postprocessor.conf_threshold = conf_threshold
+
+    @nms_threshold.setter
+    def nms_threshold(self, nms_threshold):
+        assert isinstance(nms_threshold, float), \
+            "The value to set `nms_threshold` must be type of float."
+        self._postprocessor.nms_threshold = nms_threshold
+
+    @multi_label.setter
+    def multi_label(self, value):
+        assert isinstance(
+            value,
+            bool), "The value to set `multi_label` must be type of bool."
+        self._postprocessor.multi_label = value
+
+
+class RKYOLOV5(FastDeployModel):
+    def __init__(self,
+                 model_file,
+                 params_file="",
+                 runtime_option=None,
+                 model_format=ModelFormat.RKNN):
+        """Load an RKYOLOV5 model in RKNN format.
+
+        :param model_file: (str)Path of model file, e.g ./yolov5.rknn
+        :param params_file: (str)Path of parameters file; RKNN models carry their parameters in the model file, so this can be set as an empty string
+        :param runtime_option: (fastdeploy.RuntimeOption)RuntimeOption for inference this model, if it's None, will use the default backend on CPU
+        :param model_format: (fastdeploy.ModelFormat)Model format of the loaded model
+        """
+        # Call the base class to initialize the backend option;
+        # the initialized option is stored in self._runtime_option
+        super(RKYOLOV5, self).__init__(runtime_option)
+
+        self._model = C.vision.detection.RKYOLOV5(
+            model_file, self._runtime_option, model_format)
+        # self.initialized indicates whether the whole model initialized successfully
+        assert self.initialized, "RKYOLOV5 initialize failed."
+
+    def predict(self, input_image, conf_threshold=0.25, nms_iou_threshold=0.5):
+        """Detect an input image
+
+        :param input_image: (numpy.ndarray)The input image data, 3-D array with layout HWC, BGR format
+        :param conf_threshold: confidence threshold for postprocessing, default is 0.25
+        :param nms_iou_threshold: iou threshold for NMS, default is 0.5
+        :return: DetectionResult
+        """
+
+        self.postprocessor.conf_threshold = conf_threshold
+        self.postprocessor.nms_threshold = nms_iou_threshold
+        return self._model.predict(input_image)
+
+    def batch_predict(self, images):
+        """Detect a batch of input images
+
+        :param images: (list of numpy.ndarray) The input image list, each element is a 3-D array with layout HWC, BGR format
+        :return: list of DetectionResult
+        """
+
+        return self._model.batch_predict(images)
+
+    @property
+    def preprocessor(self):
+        """Get the RKYOLOPreprocessor object of the loaded model
+
+        :return: RKYOLOPreprocessor
+        """
+        return self._model.preprocessor
+
+    @property
+    def postprocessor(self):
+        """Get the RKYOLOPostprocessor object of the loaded model
+
+        :return: RKYOLOPostprocessor
+        """
+        return self._model.postprocessor

From e877f0fd073145dfef4c476fee3366356bd934a2 Mon Sep 17 00:00:00 2001
From: Winter <1558270516@qq.com>
Date: Sun, 11 Dec 2022 12:57:59 +0800
Subject: [PATCH 17/77] [Android] add VoiceAssistant app example (#834)

* [Android] add VoiceAssistant.

* Create VoiceAssistantDemo

* Update and rename VoiceAssistantDemo to VoiceAssistantDemo.md

* Update VoiceAssistantDemo.md

* Delete VoiceAssistantDemo.md

* [Android] 1. delete the core folder; 2. build and configure the bdasr_V3_20210628_cfe8c44.aar file.

* change app/build.gradle etc.
* Update build.gradle Co-authored-by: DefTruth <31974251+DefTruth@users.noreply.github.com> --- java/android/app/build.gradle | 10 +- .../VoiceAssistantMainActivity.java | 211 ++++++++++++++++++ .../VoiceAssistantWelcomeActivity.java | 30 +++ .../layout/voice_assistant_activity_main.xml | 89 ++++++++ .../res/layout/voice_assistant_welcome.xml | 76 +++++++ java/android/ui/src/main/AndroidManifest.xml | 2 + .../com/baidu/paddle/fastdeploy/ui/Utils.java | 26 +++ 7 files changed, 441 insertions(+), 3 deletions(-) create mode 100644 java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantMainActivity.java create mode 100644 java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantWelcomeActivity.java create mode 100644 java/android/app/src/main/res/layout/voice_assistant_activity_main.xml create mode 100644 java/android/app/src/main/res/layout/voice_assistant_welcome.xml diff --git a/java/android/app/build.gradle b/java/android/app/build.gradle index fde73b3b3..23b204135 100644 --- a/java/android/app/build.gradle +++ b/java/android/app/build.gradle @@ -5,7 +5,7 @@ android { defaultConfig { applicationId 'com.baidu.paddle.fastdeploy.app.examples' - minSdkVersion 15 + minSdkVersion 16 //noinspection ExpiredTargetSdkVersion targetSdkVersion 28 versionCode 1 @@ -79,6 +79,10 @@ def FD_JAVA_SDK = [ [ 'src' : 'https://bj.bcebos.com/fastdeploy/test/fastdeploy-android-sdk-latest-dev.aar', 'dest': 'libs' + ], + [ + 'src' : 'https://bj.bcebos.com/fastdeploy/test/bdasr_V3_20210628_cfe8c44.aar', + 'dest': 'libs' ] ] @@ -132,7 +136,7 @@ task downloadAndExtractSDKs(type: DefaultTask) { boolean copyFiles = false if (!file("${sdk.dest}/${sdkName}").exists()) { // Download the target SDK if not exists - if (file("${cachePath}/${sdkName}").exists()) { + if (!file("${cachePath}/${sdkName}").exists()) { println "[INFO] Downloading ${sdk.src} -> ${cachePath}/${sdkName}" ant.get(src: sdk.src, dest: file("${cachePath}/${sdkName}")) } @@ -152,4 +156,4 @@ task downloadAndExtractSDKs(type: DefaultTask) { } preBuild.dependsOn downloadAndExtractSDKs -preBuild.dependsOn downloadAndExtractModels \ No newline at end of file +preBuild.dependsOn downloadAndExtractModels diff --git a/java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantMainActivity.java b/java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantMainActivity.java new file mode 100644 index 000000000..cd1592502 --- /dev/null +++ b/java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantMainActivity.java @@ -0,0 +1,211 @@ +package com.baidu.paddle.fastdeploy.app.examples.ernie.applications; + +import static com.baidu.paddle.fastdeploy.ui.Utils.isNetworkAvailable; + +import android.Manifest; +import android.app.Activity; +import android.app.AlertDialog; +import android.content.DialogInterface; +import android.content.pm.PackageManager; +import android.os.Build; +import android.os.Bundle; +import android.os.Handler; +import android.os.Message; +import android.support.annotation.NonNull; +import android.support.annotation.Nullable; +import android.util.Log; +import android.view.View; +import android.view.Window; +import android.view.WindowManager; +import android.widget.Button; +import android.widget.ImageView; +import android.widget.TextView; + +import com.baidu.aip.asrwakeup3.core.mini.AutoCheck; +import 
com.baidu.aip.asrwakeup3.core.util.AuthUtil;
+import com.baidu.paddle.fastdeploy.app.examples.R;
+import com.baidu.speech.EventListener;
+import com.baidu.speech.EventManager;
+import com.baidu.speech.EventManagerFactory;
+import com.baidu.speech.asr.SpeechConstant;
+
+import org.json.JSONObject;
+
+import java.util.ArrayList;
+import java.util.List;
+import java.util.Map;
+
+public class VoiceAssistantMainActivity extends Activity implements View.OnClickListener, EventListener {
+    private Button startVoiceBtn;
+    private TextView voiceOutput;
+    private Button startIntentBtn;
+    private TextView intentOutput;
+    private ImageView back;
+    private EventManager asr;
+    private boolean isStartVoice = false;
+    private String voiceTxt = "";
+    private int times = 0;
+    private final int REQUEST_PERMISSION = 0;
+
+    @Override
+    protected void onCreate(@Nullable Bundle savedInstanceState) {
+        super.onCreate(savedInstanceState);
+        // Fullscreen
+        requestWindowFeature(Window.FEATURE_NO_TITLE);
+        getWindow().setFlags(WindowManager.LayoutParams.FLAG_FULLSCREEN, WindowManager.LayoutParams.FLAG_FULLSCREEN);
+
+        setContentView(R.layout.voice_assistant_activity_main);
+
+        init();
+    }
+
+    private void init() {
+        checkPermission();
+        asr = EventManagerFactory.create(this, "asr");
+        asr.registerListener(this);
+        startVoiceBtn = findViewById(R.id.btn_voice);
+        startVoiceBtn.setOnClickListener(this);
+        voiceOutput = findViewById(R.id.tv_voice_output);
+        back = findViewById(R.id.iv_back);
+        back.setOnClickListener(this);
+        startIntentBtn = findViewById(R.id.btn_intent);
+        startIntentBtn.setOnClickListener(this);
+        intentOutput = findViewById(R.id.tv_intent_output);
+    }
+
+    @Override
+    public void onClick(View view) {
+        switch (view.getId()) {
+            case R.id.btn_voice:
+                if (!isNetworkAvailable(this)) {
+                    new AlertDialog.Builder(VoiceAssistantMainActivity.this)
+                            .setMessage("请先连接互联网。")
+                            .setCancelable(true)
+                            .show();
+                    return;
+                }
+                if (!isStartVoice) {
+                    isStartVoice = true;
+                    startVoiceBtn.setText("停止录音");
+                    start();
+                } else {
+                    isStartVoice = false;
+                    startVoiceBtn.setText("开始录音");
+                    stop();
+                }
+                break;
+            case R.id.iv_back:
+                finish();
+                break;
+            case R.id.btn_intent:
+                if (voiceTxt.equals("")) {
+                    new AlertDialog.Builder(VoiceAssistantMainActivity.this)
+                            .setMessage("请先录音。")
+                            .setCancelable(true)
+                            .show();
+                    return;
+                }
+                intentOutput.setText("我刚才说了:" + voiceTxt);
+                break;
+        }
+    }
+
+    @Override
+    public void onEvent(String name, String params, byte[] data, int offset, int length) {
+        if (name.equals(SpeechConstant.CALLBACK_EVENT_ASR_PARTIAL)) {
+            if (params.contains("\"final_result\"")) {
+                if (params.contains("[")) {
+                    voiceTxt = params.substring(params.lastIndexOf('[') + 1, params.lastIndexOf(']'));
+                }
+                voiceOutput.setText(voiceTxt);
+            }
+        }
+    }
+
+    private void start() {
+        Map<String, Object> params = AuthUtil.getParam();
+        String event = SpeechConstant.ASR_START;
+        params.put(SpeechConstant.ACCEPT_AUDIO_VOLUME, false);
+        (new AutoCheck(getApplicationContext(), new Handler() {
+            public void handleMessage(Message msg) {
+                if (msg.what == 100) {
+                    AutoCheck autoCheck = (AutoCheck) msg.obj;
+                    synchronized (autoCheck) {
+                        String message = autoCheck.obtainErrorMessage();
+                        Log.e(getClass().getName(), message);
+                    }
+                }
+            }
+        }, false)).checkAsr(params);
+        String json = new JSONObject(params).toString();
+        asr.send(event, json, null, 0, 0);
+    }
+
+    private void stop() {
+        asr.send(SpeechConstant.ASR_STOP, null, null, 0, 0);
+    }
+
+    @Override
+    protected void onPause() {
+        super.onPause();
+        asr.send(SpeechConstant.ASR_CANCEL, "{}", null, 0, 0);
+    }
+
+    @Override
+    protected void onDestroy() {
+        super.onDestroy();
+        asr.send(SpeechConstant.ASR_CANCEL, "{}", null, 0, 0);
+        asr.unregisterListener(this);
+    }
+
+    private void checkPermission() {
+        times++;
+        final List<String> permissionsList = new ArrayList<>();
+        if (Build.VERSION.SDK_INT >= Build.VERSION_CODES.M) {
+            if ((checkSelfPermission(Manifest.permission.RECORD_AUDIO) != PackageManager.PERMISSION_GRANTED))
+                permissionsList.add(Manifest.permission.RECORD_AUDIO);
+            if ((checkSelfPermission(Manifest.permission.ACCESS_NETWORK_STATE) != PackageManager.PERMISSION_GRANTED))
+                permissionsList.add(Manifest.permission.ACCESS_NETWORK_STATE);
+            if ((checkSelfPermission(Manifest.permission.INTERNET) != PackageManager.PERMISSION_GRANTED)) {
+                permissionsList.add(Manifest.permission.INTERNET);
+            }
+            if ((checkSelfPermission(Manifest.permission.WRITE_EXTERNAL_STORAGE) != PackageManager.PERMISSION_GRANTED)) {
+                permissionsList.add(Manifest.permission.WRITE_EXTERNAL_STORAGE);
+            }
+            if (permissionsList.size() != 0) {
+                if (times == 1) {
+                    requestPermissions(permissionsList.toArray(new String[permissionsList.size()]),
+                            REQUEST_PERMISSION);
+                } else {
+                    new AlertDialog.Builder(this)
+                            .setCancelable(true)
+                            .setTitle("提示")
+                            .setMessage("获取不到授权,APP将无法正常使用,请允许APP获取权限!")
+                            .setPositiveButton("确定", new DialogInterface.OnClickListener() {
+                                @Override
+                                public void onClick(DialogInterface arg0, int arg1) {
+                                    if (Build.VERSION.SDK_INT >= Build.VERSION_CODES.M) {
+                                        requestPermissions(permissionsList.toArray(new String[permissionsList.size()]),
+                                                REQUEST_PERMISSION);
+                                    }
+                                }
+                            }).setNegativeButton("取消", new DialogInterface.OnClickListener() {
+                        @Override
+                        public void onClick(DialogInterface arg0, int arg1) {
+                            finish();
+                        }
+                    }).show();
+                }
+            }
+        }
+    }
+
+    @Override
+    public void onRequestPermissionsResult(int requestCode, @NonNull String[] permissions, @NonNull int[] grantResults) {
+        super.onRequestPermissionsResult(requestCode, permissions, grantResults);
+        checkPermission();
+    }
+}
diff --git a/java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantWelcomeActivity.java b/java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantWelcomeActivity.java
new file mode 100644
index 000000000..f81c1c0ca
--- /dev/null
+++ b/java/android/app/src/main/java/com/baidu/paddle/fastdeploy/app/examples/ernie/applications/VoiceAssistantWelcomeActivity.java
@@ -0,0 +1,30 @@
+package com.baidu.paddle.fastdeploy.app.examples.ernie.applications;
+
+import android.app.Activity;
+import android.content.Intent;
+import android.graphics.Color;
+import android.os.Build;
+import android.os.Bundle;
+import android.support.annotation.Nullable;
+import android.view.View;
+
+import com.baidu.paddle.fastdeploy.app.examples.R;
+
+public class VoiceAssistantWelcomeActivity extends Activity {
+    @Override
+    protected void onCreate(@Nullable Bundle savedInstanceState) {
+        super.onCreate(savedInstanceState);
+        if (Build.VERSION.SDK_INT > Build.VERSION_CODES.LOLLIPOP) {
+            getWindow().getDecorView().setSystemUiVisibility(View.SYSTEM_UI_FLAG_LAYOUT_FULLSCREEN
+                    | View.SYSTEM_UI_FLAG_LAYOUT_STABLE
+            );
+            getWindow().setStatusBarColor(Color.TRANSPARENT);
+        }
+        setContentView(R.layout.voice_assistant_welcome);
+    }
+
+    public void startActivity(View view) {
+        Intent intent = new Intent(VoiceAssistantWelcomeActivity.this, VoiceAssistantMainActivity.class);
+        startActivity(intent);
+    }
+}
diff --git a/java/android/app/src/main/res/layout/voice_assistant_activity_main.xml b/java/android/app/src/main/res/layout/voice_assistant_activity_main.xml
new file mode 100644
index 000000000..c6376ac38
--- /dev/null
+++ b/java/android/app/src/main/res/layout/voice_assistant_activity_main.xml
@@ -0,0 +1,89 @@
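+<!-- The original markup of this 89-line layout did not survive extraction.
+     Below is a minimal sketch of what the layout must declare, based on the
+     view ids looked up in VoiceAssistantMainActivity (iv_back, btn_voice,
+     tv_voice_output, btn_intent, tv_intent_output); all attributes here are
+     assumptions, not the original file. -->
+<LinearLayout xmlns:android="http://schemas.android.com/apk/res/android"
+    android:layout_width="match_parent"
+    android:layout_height="match_parent"
+    android:orientation="vertical">
+
+    <ImageView
+        android:id="@+id/iv_back"
+        android:layout_width="wrap_content"
+        android:layout_height="wrap_content" />
+
+    <Button
+        android:id="@+id/btn_voice"
+        android:layout_width="match_parent"
+        android:layout_height="wrap_content" />
+
+    <TextView
+        android:id="@+id/tv_voice_output"
+        android:layout_width="match_parent"
+        android:layout_height="wrap_content" />
+
+    <Button
+        android:id="@+id/btn_intent"
+        android:layout_width="match_parent"
+        android:layout_height="wrap_content" />
+
+    <TextView
+        android:id="@+id/tv_intent_output"
+        android:layout_width="match_parent"
+        android:layout_height="wrap_content" />
+</LinearLayout>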