[Metax] adapt DeepSeek (#4498)

2025-12-24 13:28:13 +08:00 · 2025-10-24 10:14:53 +08:00
parent 8718fa34b2
commit f7069b8057
19 changed files with 1538 additions and 324 deletions
--- a/fastdeploy/model_executor/model_loader/default_loader.py
+++ b/fastdeploy/model_executor/model_loader/default_loader.py
@@ -43,12 +43,12 @@ class DefaultModelLoader(BaseModelLoader):

    def clean_memory_fragments(self, state_dict: dict) -> None:
        """clean_memory_fragments"""
-        if current_platform.is_cuda():
+        if current_platform.is_cuda() or current_platform.is_maca():
            if state_dict:
                for k, v in state_dict.items():
                    if isinstance(v, paddle.Tensor):
                        v.value().get_tensor()._clear()
-            paddle.device.cuda.empty_cache()
+            paddle.device.empty_cache()
            paddle.device.synchronize()

    @measure_time()