Fix bug: disable prefix caching for multi-modal models when CUDAGraph is enabled (#4679)

2025-12-24 13:28:13 +08:00 · 2025-10-31 14:59:18 +08:00
parent 0f75b62de2
commit 096d87d335
1 changed file with 4 additions and 0 deletions
--- a/fastdeploy/config.py
+++ b/fastdeploy/config.py
@@ -1556,6 +1556,10 @@ class FDConfig:
            self.graph_opt_config.use_cudagraph = False
            logger.info(f"CUDAGraph only support on GPU, current device type is {self.device_config.device_type}!")

+        if self.model_config.enable_mm and self.graph_opt_config.use_cudagraph:
+            self.cache_config.enable_prefix_caching = False
+            logger.info("Multi-modal models do not support prefix caching when using CUDAGraph!")
+
        if self.scheduler_config.splitwise_role == "mixed":
            self.model_config.moe_phase = MoEPhase(phase="prefill")
        elif self.scheduler_config.splitwise_role == "prefill":