mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
5 lines
100 B
YAML
5 lines
100 B
YAML
# Deployment settings for a single model: which model to load plus three sizing knobs.
# NOTE(review): the publicly released model ID is spelled "ERNIE-4.5-..." (with a dot);
# confirm that "ERNIE-45" below is an intentional local path/alias and not a typo.
model: "baidu/ERNIE-45-300B-A47B-Paddle"
|
|
# 32768 = 32 * 1024. Presumably the maximum context length in tokens — TODO confirm against the consumer of this file.
max_model_len: 32768
|
|
# Presumably the upper bound on concurrently scheduled sequences — TODO confirm.
max_num_seqs: 128
|
|
# Fraction in [0, 1]; presumably the share of KV-cache blocks given to one phase versus the other — TODO confirm exact semantics.
kv_cache_ratio: 0.5
|