mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-09-29 22:02:30 +08:00
Update cache_messager.py (#3172)
This commit is contained in:
@@ -142,7 +142,7 @@ class CacheMessager:
|
||||
|
||||
self.gpu_id = gpu_id
|
||||
self.cache_info = dict()
|
||||
- self.dp_rank_id = local_data_parallel_id
+ self.dp_rank_id = self.rank + local_data_parallel_id * self.nranks
|
||||
|
||||
layerwise_send_cache_thread = threading.Thread(target=self._prefill_layerwise_send_cache_thread)
|
||||
layerwise_send_cache_thread.daemon = True
|
||||
|
Reference in New Issue
Block a user