mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Quantization] Update auto compression configs files. (#846)
* Fix links in readme * Fix links in readme * Update PPOCRv2/v3 examples * Update auto compression configs
This commit is contained in:
@@ -24,7 +24,7 @@ Distillation:
|
||||
alpha: 1.0 #蒸馏loss所占权重
|
||||
loss: soft_label #蒸馏loss算法
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true #是否采用ONNX量化标准格式, 要在FastDeploy上部署, 必须选true
|
||||
use_pact: true #量化训练是否使用PACT方法
|
||||
activation_quantize_type: 'moving_average_abs_max' #激活量化方式
|
||||
|
||||
@@ -26,7 +26,7 @@ Distillation:
|
||||
alpha: 1.0 #Distillation loss weight
|
||||
loss: soft_label #Distillation loss algorithm
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true #Whether to use the ONNX standard quantization format; must be true to deploy on FastDeploy
|
||||
use_pact: true #Whether to use the PACT method during quantization training
|
||||
activation_quantize_type: 'moving_average_abs_max' #Activation quantization method
|
||||
|
||||
@@ -17,7 +17,7 @@ Distillation:
|
||||
- softmax_0.tmp_0
|
||||
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
use_pact: true
|
||||
activation_bits: 8
|
||||
is_full_quantize: false
|
||||
|
||||
@@ -16,7 +16,7 @@ Distillation:
|
||||
node:
|
||||
- softmax_0.tmp_0
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
use_pact: true
|
||||
activation_bits: 8
|
||||
is_full_quantize: false
|
||||
|
||||
@@ -14,7 +14,7 @@ Distillation:
|
||||
alpha: 1.0
|
||||
loss: soft_label
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true
|
||||
use_pact: true
|
||||
activation_quantize_type: 'moving_average_abs_max'
|
||||
|
||||
@@ -14,7 +14,7 @@ Distillation:
|
||||
alpha: 1.0
|
||||
loss: soft_label
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true
|
||||
use_pact: true
|
||||
activation_quantize_type: 'moving_average_abs_max'
|
||||
|
||||
@@ -14,7 +14,7 @@ Distillation:
|
||||
alpha: 1.0
|
||||
loss: soft_label
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true
|
||||
use_pact: true
|
||||
activation_quantize_type: 'moving_average_abs_max'
|
||||
|
||||
@@ -14,12 +14,13 @@ Distillation:
|
||||
alpha: 1.0
|
||||
loss: soft_label
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true
|
||||
activation_quantize_type: 'moving_average_abs_max'
|
||||
quantize_op_types:
|
||||
- conv2d
|
||||
- depthwise_conv2d
|
||||
- conv2d_transpose
|
||||
|
||||
|
||||
PTQ:
|
||||
|
||||
@@ -14,7 +14,7 @@ Distillation:
|
||||
alpha: 1.0
|
||||
loss: soft_label
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: true
|
||||
activation_quantize_type: 'moving_average_abs_max'
|
||||
quantize_op_types:
|
||||
|
||||
@@ -17,7 +17,7 @@ Distillation:
|
||||
node:
|
||||
- conv2d_94.tmp_0
|
||||
|
||||
Quantization:
|
||||
QuantAware:
|
||||
onnx_format: True
|
||||
quantize_op_types:
|
||||
- conv2d
|
||||
|
||||
Reference in New Issue
Block a user