From b52971749c4ec06e70a1b760ecb704ef1d26e3c1 Mon Sep 17 00:00:00 2001 From: qw86972190 <127910106+qw86972190@users.noreply.github.com> Date: Wed, 17 Sep 2025 20:01:55 +0800 Subject: [PATCH] Print KV Cache available memory and block memory usage in GB format (#4148) --- fastdeploy/worker/worker_process.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/fastdeploy/worker/worker_process.py b/fastdeploy/worker/worker_process.py index 411418977..e9dca5884 100644 --- a/fastdeploy/worker/worker_process.py +++ b/fastdeploy/worker/worker_process.py @@ -382,7 +382,7 @@ class PaddleDisWorkerProc: if num_blocks_local > 40000: logger.info(f"------- Reset num_blocks_local {num_blocks_local} to 40000") num_blocks_local = min(40000, num_blocks_local) - logger.info(f"------- model_block_memory_used:{model_block_memory_used} --------") + logger.info(f"------- model_block_memory_used:{model_block_memory_used / 1024**3} GB --------") logger.info(f"------- num_blocks_local:{num_blocks_local} --------") if num_blocks_local <= 0: