mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
[Feature] support seed parameter (#3161)
* support seed * fix * add SamplingMetadata seed test * The next_tokens values are inconsistent! * add air and rejection seed test * fix * add SamplingParams seed test * fix seed=0 * Default to defualt * fix * fix args_utils * fix review * fix review * fix * fix * add xpu,gcu,iluvatar support seed * fix
This commit is contained in:
@@ -23,7 +23,7 @@ from paddle import nn
|
||||
from fastdeploy import envs
|
||||
from fastdeploy.config import FDConfig
|
||||
from fastdeploy.engine.request import Request
|
||||
from fastdeploy.utils import get_logger
|
||||
from fastdeploy.utils import get_logger, set_random_seed
|
||||
from fastdeploy.worker.output import ModelRunnerOutput
|
||||
from fastdeploy.worker.worker_base import WorkerBase
|
||||
from fastdeploy.worker.xpu_model_runner import XPUModelRunner
|
||||
@@ -60,6 +60,7 @@ class XpuWorker(WorkerBase):
|
||||
else:
|
||||
raise RuntimeError(f"Not support device type: {self.device_config.device}")
|
||||
|
||||
set_random_seed(self.fd_config.model_config.seed)
|
||||
# Construct model runner
|
||||
self.model_runner: XPUModelRunner = XPUModelRunner(
|
||||
fd_config=self.fd_config,
|
||||
@@ -110,6 +111,7 @@ class XpuWorker(WorkerBase):
|
||||
|
||||
self.model_runner.prepare_profile()
|
||||
self.model_runner.profile_run()
|
||||
set_random_seed(self.fd_config.model_config.seed)
|
||||
|
||||
total_available_memory = int(total_memory * self.cache_config.gpu_memory_utilization)
|
||||
used_memory = xpu_get_used_global_memory(int(self.device_ids[self.local_rank]))
|
||||
|
Reference in New Issue
Block a user