mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
Update cache_messager.py (#3173)
This commit is contained in:
@@ -142,7 +142,7 @@ class CacheMessager:
|
|||||||
|
|
||||||
self.gpu_id = gpu_id
|
self.gpu_id = gpu_id
|
||||||
self.cache_info = dict()
|
self.cache_info = dict()
|
||||||
self.dp_rank_id = local_data_parallel_id
|
self.dp_rank_id = self.rank + local_data_parallel_id * self.nranks
|
||||||
|
|
||||||
layerwise_send_cache_thread = threading.Thread(target=self._prefill_layerwise_send_cache_thread)
|
layerwise_send_cache_thread = threading.Thread(target=self._prefill_layerwise_send_cache_thread)
|
||||||
layerwise_send_cache_thread.daemon = True
|
layerwise_send_cache_thread.daemon = True
|
||||||
|
Reference in New Issue
Block a user