mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-18 14:40:44 +08:00
@@ -70,7 +70,7 @@ class ModelConfig:
|
|||||||
self.stop_seqs_max_len = 8
|
self.stop_seqs_max_len = 8
|
||||||
|
|
||||||
# NOTE(gongshaotain): from _load_model_init_val()
|
# NOTE(gongshaotain): from _load_model_init_val()
|
||||||
self.top_p = 0.0
|
self.top_p = 1.0
|
||||||
self.temperature = 1.0
|
self.temperature = 1.0
|
||||||
self.rope_theta = 10000.0
|
self.rope_theta = 10000.0
|
||||||
self.penalty_score = 1.0
|
self.penalty_score = 1.0
|
||||||
|
@@ -419,7 +419,6 @@ class GPUModelRunner(ModelRunnerBase):
|
|||||||
self.share_inputs["max_dec_len"][idx:idx + 1] = max_dec_len
|
self.share_inputs["max_dec_len"][idx:idx + 1] = max_dec_len
|
||||||
self.share_inputs["min_dec_len"][idx:idx + 1] = max_dec_len
|
self.share_inputs["min_dec_len"][idx:idx + 1] = max_dec_len
|
||||||
self.share_inputs["stop_flags"][idx:idx + 1] = False
|
self.share_inputs["stop_flags"][idx:idx + 1] = False
|
||||||
self.share_inputs["top_p"][idx:idx + 1] = 0.0
|
|
||||||
self.share_inputs["temperature"][idx:idx + 1] = 1
|
self.share_inputs["temperature"][idx:idx + 1] = 1
|
||||||
|
|
||||||
self.share_inputs["first_token_ids"][
|
self.share_inputs["first_token_ids"][
|
||||||
|
Reference in New Issue
Block a user