mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
Unify server-side and model-side Config (Part1) (#3018)
* move cache config * fix mtp
This commit is contained in:
@@ -137,7 +137,7 @@ class GpuWorker(WorkerBase):
|
||||
pynvml.nvmlShutdown()
|
||||
|
||||
available_kv_cache_memory = (
|
||||
after_run_meminfo.total * self.parallel_config.gpu_memory_utilization
|
||||
after_run_meminfo.total * self.cache_config.gpu_memory_utilization
|
||||
- after_run_meminfo.used
|
||||
- paddle_peak_increase
|
||||
)
|
||||
|
Reference in New Issue
Block a user