Add Quantization Function. (#256)

* Add PaddleOCR Support * Add PaddleOCR Support * Add PaddleOCRv3 Support * Add PaddleOCRv3 Support * Update README.md * Update README.md * Update README.md * Update README.md * Add PaddleOCRv3 Support * Add PaddleOCRv3 Supports * Add PaddleOCRv3 Suport * Fix Rec diff * Remove useless functions * Remove useless comments * Add PaddleOCRv2 Support * Add PaddleOCRv3 & PaddleOCRv2 Support * remove useless parameters * Add utils of sorting det boxes * Fix code naming convention * Fix code naming convention * Fix code naming convention * Fix bug in the Classify process * Imporve OCR Readme * Fix diff in Cls model * Update Model Download Link in Readme * Fix diff in PPOCRv2 * Improve OCR readme * Imporve OCR readme * Improve OCR readme * Improve OCR readme * Imporve OCR readme * Improve OCR readme * Fix conflict * Add readme for OCRResult * Improve OCR readme * Add OCRResult readme * Improve OCR readme * Improve OCR readme * Add Model Quantization Demo * Fix Model Quantization Readme * Fix Model Quantization Readme * Add the function to do PTQ quantization * Improve quant tools readme * Improve quant tool readme * Improve quant tool readme * Add PaddleInference-GPU for OCR Rec model * Add QAT method to fastdeploy-quantization tool * Remove examples/slim for now * Move configs folder * Add Quantization Support for Classification Model * Imporve ways of importing preprocess * Upload YOLO Benchmark on readme * Upload YOLO Benchmark on readme * Upload YOLO Benchmark on readme * Improve Quantization configs and readme * Add support for multi-inputs model
2025-12-24 13:28:13 +08:00 · 2022-10-08 15:45:28 +08:00
parent 8d47637541
commit 1efc0fa6b0
13 changed files with 736 additions and 0 deletions
--- a/tools/quantization/fdquant/init.py
+++ b/tools/quantization/fdquant/init.py
--- a/tools/quantization/fdquant/dataset.py
+++ b/tools/quantization/fdquant/dataset.py
@@ -0,0 +1,150 @@
+# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import cv2
+import os
+import numpy as np
+import paddle
+
+
+def generate_scale(im, target_shape):
+    origin_shape = im.shape[:2]
+    im_size_min = np.min(origin_shape)
+    im_size_max = np.max(origin_shape)
+    target_size_min = np.min(target_shape)
+    target_size_max = np.max(target_shape)
+    im_scale = float(target_size_min) / float(im_size_min)
+    if np.round(im_scale * im_size_max) > target_size_max:
+        im_scale = float(target_size_max) / float(im_size_max)
+    im_scale_x = im_scale
+    im_scale_y = im_scale
+
+    return im_scale_y, im_scale_x
+
+
+def yolo_image_preprocess(img, target_shape=[640, 640]):
+    # Resize image
+    im_scale_y, im_scale_x = generate_scale(img, target_shape)
+    img = cv2.resize(
+        img,
+        None,
+        None,
+        fx=im_scale_x,
+        fy=im_scale_y,
+        interpolation=cv2.INTER_LINEAR)
+    # Pad
+    im_h, im_w = img.shape[:2]
+    h, w = target_shape[:]
+    if h != im_h or w != im_w:
+        canvas = np.ones((h, w, 3), dtype=np.float32)
+        canvas *= np.array([114.0, 114.0, 114.0], dtype=np.float32)
+        canvas[0:im_h, 0:im_w, :] = img.astype(np.float32)
+        img = canvas
+    img = np.transpose(img / 255, [2, 0, 1])
+
+    return img.astype(np.float32)
+
+
+def cls_resize_short(img, target_size):
+
+    img_h, img_w = img.shape[:2]
+    percent = float(target_size) / min(img_w, img_h)
+    w = int(round(img_w * percent))
+    h = int(round(img_h * percent))
+
+    return cv2.resize(img, (w, h), interpolation=cv2.INTER_LINEAR)
+
+
+def crop_image(img, target_size, center):
+
+    height, width = img.shape[:2]
+    size = target_size
+
+    if center == True:
+        w_start = (width - size) // 2
+        h_start = (height - size) // 2
+    else:
+        w_start = np.random.randint(0, width - size + 1)
+        h_start = np.random.randint(0, height - size + 1)
+    w_end = w_start + size
+    h_end = h_start + size
+
+    return img[h_start:h_end, w_start:w_end, :]
+
+
+def cls_image_preprocess(img):
+
+    # resize
+    img = cls_resize_short(img, target_size=256)
+    # crop
+    img = crop_image(img, target_size=224, center=True)
+
+    #ToCHWImage & Normalize
+    img = np.transpose(img / 255, [2, 0, 1])
+
+    img_mean = np.array([0.485, 0.456, 0.406]).reshape((3, 1, 1))
+    img_std = np.array([0.229, 0.224, 0.225]).reshape((3, 1, 1))
+    img -= img_mean
+    img /= img_std
+
+    return img.astype(np.float32)
+
+
+def ppdet_resize_no_keepratio(img, target_shape=[640, 640]):
+    im_shape = img.shape
+
+    resize_h, resize_w = target_shape
+    im_scale_y = resize_h / im_shape[0]
+    im_scale_x = resize_w / im_shape[1]
+
+    scale_factor = np.asarray([im_scale_y, im_scale_x], dtype=np.float32)
+    return cv2.resize(
+        img, None, None, fx=im_scale_x, fy=im_scale_y,
+        interpolation=2), scale_factor
+
+
+def ppdet_normliaze(img, is_scale=True):
+
+    mean = [0.485, 0.456, 0.406]
+    std = [0.229, 0.224, 0.225]
+    img = img.astype(np.float32, copy=False)
+
+    if is_scale:
+        scale = 1.0 / 255.0
+        img *= scale
+
+    mean = np.array(mean)[np.newaxis, np.newaxis, :]
+    std = np.array(std)[np.newaxis, np.newaxis, :]
+    img -= mean
+    img /= std
+    return img
+
+
+def hwc_to_chw(img):
+    img = img.transpose((2, 0, 1))
+    return img
+
+
+def ppdet_image_preprocess(img):
+
+    img, scale_factor = ppdet_resize_no_keepratio(img, target_shape=[640, 640])
+
+    img = np.transpose(img / 255, [2, 0, 1])
+
+    img_mean = np.array([0.485, 0.456, 0.406]).reshape((3, 1, 1))
+    img_std = np.array([0.229, 0.224, 0.225]).reshape((3, 1, 1))
+    img -= img_mean
+    img /= img_std
+
+    return img.astype(np.float32), scale_factor
--- a/tools/quantization/fdquant/fdquant.py
+++ b/tools/quantization/fdquant/fdquant.py
@@ -0,0 +1,155 @@
+# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+import sys
+import numpy as np
+import time
+import argparse
+from tqdm import tqdm
+import paddle
+from paddleslim.common import load_config, load_onnx_model
+from paddleslim.auto_compression import AutoCompression
+from paddleslim.quant import quant_post_static
+from fdquant.dataset import *
+
+
+def argsparser():
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument(
+        '--config_path',
+        type=str,
+        default=None,
+        help="path of compression strategy config.",
+        required=True)
+    parser.add_argument(
+        '--method',
+        type=str,
+        default=None,
+        help="choose PTQ or QAT as quantization method",
+        required=True)
+    parser.add_argument(
+        '--save_dir',
+        type=str,
+        default='output',
+        help="directory to save compressed model.")
+    parser.add_argument(
+        '--devices',
+        type=str,
+        default='gpu',
+        help="which device used to compress.")
+
+    return parser
+
+
+def reader_wrapper(reader, input_list=None):
+    def gen():
+        for data_list in reader:
+            in_dict = {}
+            for data in data_list:
+                for i, input_name in enumerate(input_list):
+                    in_dict[input_name] = data[i]
+                yield in_dict
+
+    return gen
+
+
+def main():
+
+    time_s = time.time()
+
+    paddle.enable_static()
+    parser = argsparser()
+    FLAGS = parser.parse_args()
+
+    assert FLAGS.devices in ['cpu', 'gpu', 'xpu', 'npu']
+    paddle.set_device(FLAGS.devices)
+
+    global global_config
+    all_config = load_config(FLAGS.config_path)
+    assert "Global" in all_config, f"Key 'Global' not found in config file. \n{all_config}"
+    global_config = all_config["Global"]
+    input_list = global_config['input_list']
+
+    assert os.path.exists(global_config[
+        'image_path']), "image_path does not exist!"
+    paddle.vision.image.set_image_backend('cv2')
+    # transform could be customized.
+    train_dataset = paddle.vision.datasets.ImageFolder(
+        global_config['image_path'],
+        transform=eval(global_config['preprocess']))
+    train_loader = paddle.io.DataLoader(
+        train_dataset,
+        batch_size=1,
+        shuffle=True,
+        drop_last=True,
+        num_workers=0)
+    train_loader = reader_wrapper(train_loader, input_list=input_list)
+    eval_func = None
+
+    # ACT compression
+    if FLAGS.method == 'QAT':
+        ac = AutoCompression(
+            model_dir=global_config['model_dir'],
+            model_filename=global_config['model_filename'],
+            params_filename=global_config['params_filename'],
+            train_dataloader=train_loader,
+            save_dir=FLAGS.save_dir,
+            config=all_config,
+            eval_callback=eval_func)
+        ac.compress()
+
+    # PTQ compression
+    if FLAGS.method == 'PTQ':
+
+        # Read PTQ config
+        assert "PTQ" in all_config, f"Key 'PTQ' not found in config file. \n{all_config}"
+        ptq_config = all_config["PTQ"]
+
+        # Inititalize the executor
+        place = paddle.CUDAPlace(
+            0) if FLAGS.devices == 'gpu' else paddle.CPUPlace()
+        exe = paddle.static.Executor(place)
+
+        # Read ONNX or PADDLE format model
+        if global_config['format'] == 'onnx':
+            load_onnx_model(global_config["model_dir"])
+            inference_model_path = global_config["model_dir"].rstrip().rstrip(
+                '.onnx') + '_infer'
+        else:
+            inference_model_path = global_config["model_dir"].rstrip('/')
+
+        quant_post_static(
+            executor=exe,
+            model_dir=inference_model_path,
+            quantize_model_path=FLAGS.save_dir,
+            data_loader=train_loader,
+            model_filename=global_config["model_filename"],
+            params_filename=global_config["params_filename"],
+            batch_size=32,
+            batch_nums=10,
+            algo=ptq_config['calibration_method'],
+            hist_percent=0.999,
+            is_full_quantize=False,
+            bias_correction=False,
+            onnx_format=True,
+            skip_tensor_list=ptq_config['skip_tensor_list']
+            if 'skip_tensor_list' in ptq_config else None)
+
+    time_total = time.time() - time_s
+    print("Finish Compression, total time used is : ", time_total, "seconds.")
+
+
+if __name__ == '__main__':
+    main()