Skip to content

Commit d70aacf

Browse files
authored
[FDConfig] Turn on the CUDAGraph + MultiModel switch (#4512)
1 parent 809c1ac commit d70aacf

File tree

1 file changed

+3
-10
lines changed

1 file changed

+3
-10
lines changed

fastdeploy/config.py

Lines changed: 3 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1510,14 +1510,12 @@ def postprocess(self):
15101510
self.structured_outputs_config.guided_decoding_backend = "xgrammar"
15111511

15121512
# Adjustment GraphOptConfig
1513-
if (
1514-
(self.scheduler_config.splitwise_role != "mixed")
1515-
or (self.model_config is not None and self.model_config.enable_mm is True)
1516-
or (self.load_config is not None and self.load_config.dynamic_load_weight is True)
1513+
if (self.scheduler_config.splitwise_role != "mixed") or (
1514+
self.load_config is not None and self.load_config.dynamic_load_weight is True
15171515
):
15181516
self.graph_opt_config.use_cudagraph = False
15191517
logger.info(
1520-
"CUDAGraph does not support to be started together with MultiModel temporarily, but has been automatically closed!"
1518+
"CUDAGraph does not support to be started together with PD Disaggregation temporarily, but has been automatically closed!"
15211519
)
15221520
if self.load_config is not None and self.load_config.dynamic_load_weight is True:
15231521
self.graph_opt_config.graph_opt_level = 0
@@ -1632,11 +1630,6 @@ def check(self):
16321630
self.scheduler_config.check()
16331631

16341632
# Check graph optimization config
1635-
if self.graph_opt_config.use_cudagraph:
1636-
if self.model_config is not None:
1637-
assert (
1638-
self.model_config.enable_mm is not True
1639-
), "CUDAGraph cannot be applied to multimodal model temporarily"
16401633
if self.graph_opt_config.graph_opt_level > 0 or self.graph_opt_config.use_cudagraph:
16411634
if self.load_config is not None:
16421635
assert (

0 commit comments

Comments
 (0)