2525 env :
2626 VLLM_LOGGING_LEVEL : ERROR
2727 VLLM_USE_MODELSCOPE : True
28+ TRANSFORMERS_OFFLINE : 1
2829 steps :
2930 - name : Check npu and CANN info
3031 run : |
7475 PYTORCH_NPU_ALLOC_CONF : max_split_size_mb:256
7576 if : ${{ inputs.type == 'light' }}
7677 run : |
77- # pytest -sv tests/e2e/singlecard/test_aclgraph.py
78+ # pytest -sv tests/e2e/singlecard/test_aclgraph_accuracy.py
7879 # pytest -sv tests/e2e/singlecard/test_quantization.py
7980 pytest -sv tests/e2e/singlecard/test_vlm.py::test_multimodal_vl
81+ pytest -sv tests/e2e/singlecard/pooling/test_classification.py::test_classify_correctness
8082
8183 - name : Run e2e test
8284 env :
@@ -89,25 +91,21 @@ jobs:
8991 # the test separately.
9092
9193 pytest -sv tests/e2e/singlecard/test_completion_with_prompt_embeds.py
92- pytest -sv tests/e2e/singlecard/test_aclgraph.py
94+ pytest -sv tests/e2e/singlecard/test_aclgraph_accuracy.py
9395 pytest -sv tests/e2e/singlecard/test_aclgraph_mem.py
94- pytest -sv tests/e2e/singlecard/test_bge_model.py
9596 pytest -sv tests/e2e/singlecard/test_camem.py
96- pytest -sv tests/e2e/singlecard/test_embedding.py
97- # pytest -sv tests/e2e/singlecard/test_embedding_aclgraph.py
9897 pytest -sv tests/e2e/singlecard/test_guided_decoding.py
9998 # torch 2.8 doesn't work with lora, fix me
10099 #pytest -sv tests/e2e/singlecard/test_ilama_lora.py
101100 pytest -sv tests/e2e/singlecard/test_profile_execute_duration.py
102101 pytest -sv tests/e2e/singlecard/test_quantization.py
103102 pytest -sv tests/e2e/singlecard/test_sampler.py
104103 pytest -sv tests/e2e/singlecard/test_vlm.py
105- pytest -sv tests/e2e/singlecard/multi-modal/test_internvl.py
106104 pytest -sv tests/e2e/singlecard/test_xlite.py
105+ pytest -sv tests/e2e/singlecard/pooling/
107106
108107 # ------------------------------------ v1 spec decode test ------------------------------------ #
109108 pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py
110- pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_torchair_correctness.py
111109 pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py
112110
113111 e2e-2-cards :
@@ -119,6 +117,7 @@ jobs:
119117 VLLM_LOGGING_LEVEL : ERROR
120118 VLLM_USE_MODELSCOPE : True
121119 HCCL_BUFFSIZE : 1024
120+ TRANSFORMERS_OFFLINE : 1
122121 steps :
123122 - name : Check npu and CANN info
124123 run : |
@@ -170,10 +169,6 @@ jobs:
170169 if : ${{ inputs.type == 'light' }}
171170 run : |
172171 pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP
173- pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_qwen3_moe_with_torchair
174- pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_deepseekv2lite_with_torchair
175- pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_deepseekv2lite_with_torchair_v1scheduler
176- pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_deepseekv2lite_with_nz
177172
178173 - name : Run vllm-project/vllm-ascend test (full)
179174 env :
@@ -183,7 +178,6 @@ jobs:
183178 run : |
184179 pytest -sv tests/e2e/multicard/test_quantization.py
185180 pytest -sv tests/e2e/multicard/test_aclgraph_capture_replay.py
186- pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py
187181 pytest -sv tests/e2e/multicard/test_full_graph_mode.py
188182 pytest -sv tests/e2e/multicard/test_data_parallel.py
189183 pytest -sv tests/e2e/multicard/test_expert_parallel.py
@@ -220,6 +214,7 @@ jobs:
220214 env :
221215 VLLM_LOGGING_LEVEL : ERROR
222216 VLLM_USE_MODELSCOPE : True
217+ TRANSFORMERS_OFFLINE : 1
223218 steps :
224219 - name : Check npu and CANN info
225220 run : |
@@ -272,6 +267,7 @@ jobs:
272267 run : |
273268 pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_multistream_moe
274269 pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_W4A8DYNAMIC
270+ pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Kimi_K2_Thinking_W4A16
275271 # pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP
276272 # pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_W8A8_WITH_EP
277273 pytest -sv tests/e2e/multicard/test_data_parallel_tp2.py
0 commit comments