mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-03 15:56:49 +08:00
fix config (#2858)
This commit is contained in:
@@ -59,6 +59,7 @@ PRETRAINED_INIT_CONFIGURATION = {
 "tie_word_embeddings":False,
 "rms_norm_eps":1e-5,
 "moe_num_experts": None,
+"moe_layer_end_index":None,
 }
 
 
@@ -330,7 +331,7 @@ class GraphOptimizationConfig:
 if len(dedup_sizes) < len(self.cudagraph_capture_sizes):
 logger.info(("cudagraph sizes specified by model runner"
 " %s is overridden by config %s"),
-cudagraph_capture_sizes, dedup_sizes)
+self.cudagraph_capture_sizes, dedup_sizes)
 self.cudagraph_capture_sizes = dedup_sizes
 
 # Sort to make sure cudagraph capture sizes are in descending order
Reference in New Issue
Block a user