@@ -99,14 +99,14 @@ jobs:
9999 # pytest -sv tests/e2e/singlecard/test_embedding_aclgraph.py
100100 #s pytest -sv tests/e2e/singlecard/test_guided_decoding.py
101101 #s pytest -sv tests/e2e/singlecard/test_ilama_lora.py
102- pytest -sv tests/e2e/singlecard/test_profile_execute_duration.py
103- pytest -sv tests/e2e/singlecard/test_quantization.py
104- pytest -sv tests/e2e/singlecard/test_sampler.py
105- pytest -sv tests/e2e/singlecard/test_vlm.py
106- pytest -sv tests/e2e/singlecard/multi-modal/test_internvl.py
102+ #s pytest -sv tests/e2e/singlecard/test_profile_execute_duration.py
103+ #s pytest -sv tests/e2e/singlecard/test_quantization.py
104+ #s pytest -sv tests/e2e/singlecard/test_sampler.py
105+ #s pytest -sv tests/e2e/singlecard/test_vlm.py
106+ #s pytest -sv tests/e2e/singlecard/multi-modal/test_internvl.py
107107
108108 # ------------------------------------ v1 spec decode test ------------------------------------ #
109- pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py
109+ #s pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py
110110 pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_torchair_correctness.py
111111 # FIXME: test_eagle_correctness fails with an OOM error
112112 pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py
@@ -188,20 +188,20 @@ jobs:
188188 pytest -sv tests/e2e/multicard/test_ilama_lora_tp2.py
189189
190190 # To avoid OOM, we need to run the test in a single process.
191- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_QwQ
192- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_multistream_moe
193- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W8A8
194- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W4A8DYNAMIC_new_version
195- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W4A8DYNAMIC_old_version
196- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_W4A8DYNAMIC
197- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_sp_for_qwen3_moe
198- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_fc2_for_qwen3_moe
199- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen_Dense_with_flashcomm_v1
200- pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen_Dense_with_prefetch_mlp_weight
201-
202- pytest -sv tests/e2e/multicard/test_pipeline_parallel.py
203- pytest -sv tests/e2e/multicard/test_prefix_caching.py
204- pytest -sv tests/e2e/multicard/test_qwen3_moe.py
191+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_QwQ
192+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_multistream_moe
193+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W8A8
194+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W4A8DYNAMIC_new_version
195+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W4A8DYNAMIC_old_version
196+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_W4A8DYNAMIC
197+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_sp_for_qwen3_moe
198+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_fc2_for_qwen3_moe
199+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen_Dense_with_flashcomm_v1
200+ #s pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen_Dense_with_prefetch_mlp_weight
201+
202+ #s pytest -sv tests/e2e/multicard/test_pipeline_parallel.py
203+ #s pytest -sv tests/e2e/multicard/test_prefix_caching.py
204+ #s pytest -sv tests/e2e/multicard/test_qwen3_moe.py
205205
206206 e2e-4-cards :
207207 name : multicard-4
@@ -284,4 +284,4 @@ jobs:
284284 VLLM_USE_MODELSCOPE : True
285285 run : |
286286 . /usr/local/Ascend/8.3.RC1/bisheng_toolkit/set_env.sh
287- # pytest -sv tests/e2e/multicard/test_qwen3_next.py
287+ pytest -sv tests/e2e/multicard/test_qwen3_next.py
0 commit comments