mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 00:33:03 +08:00
[stop sequence] support stop sequence (#3025)
* stop seqs in multi-ends * unittest for gpu stop op * kernel tid==0
This commit is contained in:
@@ -101,9 +101,6 @@ class ModelConfig:
|
||||
self,
|
||||
args,
|
||||
):
|
||||
self.max_stop_seqs_num = 5
|
||||
self.stop_seqs_max_len = 8
|
||||
|
||||
# NOTE(gongshaotain): from _load_model_init_val()
|
||||
self.top_p = 1.0
|
||||
self.temperature = 1.0
|
||||
@@ -122,6 +119,9 @@ class ModelConfig:
|
||||
self.enable_redundant_experts = False
|
||||
self.redundant_experts_num = 0
|
||||
|
||||
self.max_stop_seqs_num = int(envs.FD_MAX_STOP_SEQS_NUM)
|
||||
self.stop_seqs_max_len = int(envs.FD_STOP_SEQS_MAX_LEN)
|
||||
|
||||
for key, value in args.items():
|
||||
if hasattr(self, key):
|
||||
setattr(self, key, value)
|
||||
|
Reference in New Issue
Block a user