2 files changed (+5 / -5 lines changed)
Original file line number | Diff line number | Diff line change
@@ -49,7 +49,7 @@ def parse_args():
4949 parser .add_argument (
5050 "--gpu_memory_utilization" ,
5151 type = float ,
52- default = 0.85 ,
52+ default = 0.95 ,
5353 help = "GPU memory utilization for vLLM (default: 0.85)" ,
5454 )
5555 parser .add_argument (
Original file line number | Diff line number | Diff line change
@@ -154,7 +154,7 @@ def _load_qwen3_vl(
154154 def _engine_args_kimi_vl (self ) -> EngineArgs :
155155 return EngineArgs (
156156 model = self .model_id ,
157- max_model_len = 32768 ,
157+ max_model_len = 8192 ,
158158 trust_remote_code = True ,
159159 limit_mm_per_prompt = {self .modality : 5 },
160160 )
@@ -272,11 +272,11 @@ def _load_deepseek_vl2(
272272 def _engine_args_glm4_5v (self ) -> EngineArgs :
273273 return EngineArgs (
274274 model = self .model_id ,
275- max_model_len = 32768 ,
275+ max_model_len = 8192 ,
276276 max_num_seqs = 2 ,
277277 trust_remote_code = True ,
278278 enforce_eager = True ,
279- limit_mm_per_prompt = {self . modality : 5 },
279+ limit_mm_per_prompt = {"image" : 5 , "video" : 0 },
280280 )
281281
282282 def _load_glm4_5v (
@@ -359,7 +359,7 @@ def _load_ovis2(
359359 def _engine_args_ovis2_5 (self ) -> EngineArgs :
360360 return EngineArgs (
361361 model = self .model_id ,
362- max_model_len = 4096 ,
362+ max_model_len = 8192 ,
363363 max_num_seqs = 2 ,
364364 trust_remote_code = True ,
365365 dtype = "half" ,
You can’t perform that action at this time.
0 commit comments