mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
qwen loader (#3057)
This commit is contained in:
@@ -54,6 +54,7 @@ class Config:
|
||||
splitwise_role (str): Splitwise role.
|
||||
innode_prefill_ports (Optional[List[int]]): Innode prefill ports.
|
||||
Temporary configuration, will be removed in the future.
|
||||
load_choices(str):The format of the model weights to load. .Default is default
|
||||
"""
|
||||
|
||||
def __init__(
|
||||
@@ -88,6 +89,7 @@ class Config:
|
||||
disable_any_whitespace: bool = False,
|
||||
enable_logprob: bool = False,
|
||||
early_stop_config: Optional[Dict[str, Any]] = None,
|
||||
load_choices: str = "default",
|
||||
):
|
||||
"""
|
||||
Initialize the Config class.
|
||||
@@ -118,6 +120,7 @@ class Config:
|
||||
Default is False.
|
||||
enable_logprob(bool): Enable logprob. Default is False.
|
||||
early_stop_config (Optional[Dict[str, Any]]): Early stop configuration. Default is None.
|
||||
load_choices(str):The format of the model weights to load. .Default is default
|
||||
"""
|
||||
self.model_config = model_config
|
||||
self.cache_config = cache_config
|
||||
@@ -167,6 +170,7 @@ class Config:
|
||||
self.guided_decoding_backend = guided_decoding_backend
|
||||
self.disable_any_whitespace = disable_any_whitespace
|
||||
self._str_to_list("innode_prefill_ports", int)
|
||||
self.load_choices = load_choices
|
||||
|
||||
assert self.splitwise_role in ["mixed", "prefill", "decode"]
|
||||
|
||||
|
Reference in New Issue
Block a user