Skip to content

Commit 096d87d

Browse files
authored
fix bug (#4679)
1 parent 0f75b62 commit 096d87d

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

fastdeploy/config.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1556,6 +1556,10 @@ def postprocess(self):
1556 1556
self.graph_opt_config.use_cudagraph = False
1557 1557
logger.info(f"CUDAGraph only support on GPU, current device type is {self.device_config.device_type}!")
1558 1558

1559+
if self.model_config.enable_mm and self.graph_opt_config.use_cudagraph:
1560+
self.cache_config.enable_prefix_caching = False
1561+
logger.info("Multi-modal models do not support prefix caching when using CUDAGraph!")
1562+
1559 1563
if self.scheduler_config.splitwise_role == "mixed":
1560 1564
self.model_config.moe_phase = MoEPhase(phase="prefill")
1561 1565
elif self.scheduler_config.splitwise_role == "prefill":

0 commit comments

Comments
 (0)