Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2025-09-27 12:52:29 +08:00)
fix config (#2858)
This commit is contained in:
@@ -59,6 +59,7 @@ PRETRAINED_INIT_CONFIGURATION = {
|
||||
"tie_word_embeddings":False,
|
||||
"rms_norm_eps":1e-5,
|
||||
"moe_num_experts": None,
|
||||
"moe_layer_end_index":None,
|
||||
}
|
||||
|
||||
|
||||
@@ -330,7 +331,7 @@ class GraphOptimizationConfig:
|
||||
if len(dedup_sizes) < len(self.cudagraph_capture_sizes):
|
||||
logger.info(("cudagraph sizes specified by model runner"
|
||||
" %s is overridden by config %s"),
|
||||
- cudagraph_capture_sizes, dedup_sizes)
+ self.cudagraph_capture_sizes, dedup_sizes)
|
||||
self.cudagraph_capture_sizes = dedup_sizes
|
||||
|
||||
# Sort to make sure cudagraph capture sizes are in descending order
|
||||
|
Reference in New Issue
Block a user