@@ -1510,14 +1510,12 @@ def postprocess(self):
15101510 self .structured_outputs_config .guided_decoding_backend = "xgrammar"
15111511
15121512 # Adjustment GraphOptConfig
1513- if (
1514- (self .scheduler_config .splitwise_role != "mixed" )
1515- or (self .model_config is not None and self .model_config .enable_mm is True )
1516- or (self .load_config is not None and self .load_config .dynamic_load_weight is True )
1513+ if (self .scheduler_config .splitwise_role != "mixed" ) or (
1514+ self .load_config is not None and self .load_config .dynamic_load_weight is True
15171515 ):
15181516 self .graph_opt_config .use_cudagraph = False
15191517 logger .info (
1520- "CUDAGraph does not support to be started together with MultiModel temporarily, but has been automatically closed!"
1518+ "CUDAGraph does not support to be started together with PD Disaggregation temporarily, but has been automatically closed!"
15211519 )
15221520 if self .load_config is not None and self .load_config .dynamic_load_weight is True :
15231521 self .graph_opt_config .graph_opt_level = 0
@@ -1632,11 +1630,6 @@ def check(self):
16321630 self .scheduler_config .check ()
16331631
16341632 # Check graph optimization config
1635- if self .graph_opt_config .use_cudagraph :
1636- if self .model_config is not None :
1637- assert (
1638- self .model_config .enable_mm is not True
1639- ), "CUDAGraph cannot be applied to multimodal model temporarily"
16401633 if self .graph_opt_config .graph_opt_level > 0 or self .graph_opt_config .use_cudagraph :
16411634 if self .load_config is not None :
16421635 assert (
0 commit comments