3030 - ' .github/workflows/vllm_ascend_test.yaml'
3131 - ' !docs/**'
3232 - ' pytest.ini'
33-
33+ types : [ labeled ]
3434# Bash shells do not use ~/.profile or ~/.bashrc so these shells need to be explicitly
3535# declared as "shell: bash -el {0}" on steps that need to be properly activated.
3636# It's used to activate ascend-toolkit environment variables.
@@ -48,14 +48,14 @@ jobs:
4848 max-parallel : 2
4949 matrix :
5050 os : [linux-arm64-npu-1, linux-arm64-npu-4]
51- vllm_verison : [main, v0.8.5.post1]
51+ vllm_version : [main, v0.8.5.post1]
5252 concurrency :
5353 group : >
5454 ${{
5555 matrix.os == 'linux-arm64-npu-4'
5656 && github.event.pull_request.number
5757 && format('pr-{0}-limit-npu-4', github.event.pull_request.number)
58- || format('job-{0}-{1}-{2}', matrix.os, matrix.vllm_verison , github.event.pull_request.number)
58+ || format('job-{0}-{1}-{2}', matrix.os, matrix.vllm_version , github.event.pull_request.number)
5959 }}
6060 cancel-in-progress : false
6161 name : vLLM Ascend test
6666 env :
6767 HF_ENDPOINT : https://hf-mirror.com
6868 HF_TOKEN : ${{ secrets.HF_TOKEN }}
69+ VLLM_LOGGING_LEVEL : ERROR
6970 steps :
7071 - name : Check npu and CANN info
7172 run : |
9293 uses : actions/checkout@v4
9394 with :
9495 repository : vllm-project/vllm
95- ref : ${{ matrix.vllm_verison }}
96+ ref : ${{ matrix.vllm_version }}
9697 path : ./vllm-empty
9798
9899 - name : Install vllm-project/vllm from source
@@ -112,58 +113,28 @@ jobs:
112113 run : |
113114 if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
114115 pytest -sv tests/singlecard/test_offline_inference.py
115- pytest -sv tests/singlecard/test_ilama_lora.py
116- pytest -sv tests/ops
117- pytest -sv tests/compile
116+ # AscendScheduler doesn't work, fix it later
117+ # pytest -sv tests/singlecard/tets_schedule.py
118+ # guided decoding doesn't work, fix it later
119+ # pytest -sv tests/singlecard/test_guided_decoding.py.py
120+ pytest -sv tests/singlecard/ --ignore=tests/singlecard/test_offline_inference.py --ignore=tests/singlecard/test_scheduler.py --ignore=tests/singlecard/test_guided_decoding.py
118121 else
119- pytest -sv -k "QwQ" tests/multicard/test_offline_inference_distributed.py
120- pytest -sv tests/multicard/test_ilama_lora_tp2.py
121- pytest -sv tests/ops
122- pytest -sv tests/compile
122+ pytest -sv tests/multicard/
123123 fi
124124
125125 - name : Run vllm-project/vllm-ascend test on V0 engine
126126 env :
127127 VLLM_USE_V1 : 0
128128 run : |
129129 if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
130- pytest -sv tests/singlecard/test_ilama_lora.py
131130 pytest -sv tests/singlecard/test_offline_inference.py
132- pytest -sv tests/ops
131+ # AscendScheduler doesn't work, fix it later
132+ # pytest -sv tests/singlecard/tets_schedule.py
133+ # guided decoding doesn't work, fix it later
134+ # pytest -sv tests/singlecard/test_guided_decoding.py.py
135+ pytest -sv tests/singlecard/ --ignore=tests/singlecard/test_offline_inference.py --ignore=tests/singlecard/test_scheduler.py --ignore=tests/singlecard/test_guided_decoding.py
133136 else
134- pytest -sv tests/multicard/test_ilama_lora_tp2.py
135- pytest -sv -k "QwQ" tests/multicard/test_offline_inference_distributed.py
136- pytest -sv -k "DeepSeek" tests/multicard/test_offline_inference_distributed.py
137- pytest -sv tests/ops
138- fi
139-
140- # only run test on spec decode when the related code changed
141- - name : Check for changes in Speculative Decode
142- if : github.event_name != 'schedule'
143- id : filter_spec_decode
144- uses : dorny/paths-filter@v3
145- with :
146- filters : |
147- speculative_tests_changed:
148- - ".github/workflows/vllm_ascend_test.yaml"
149- - "tests/singlecard/spec_decode/**"
150- - "tests/multicard/spec_decode_e2e/**"
151- - "vllm_ascend/worker/worker.py"
152- - "vllm_ascend/worker/model_runner.py"
153- - "vllm_ascend/worker/multi_step_runner.py"
154- - "vllm_ascend/worker/multi_step_worker.py"
155- - "vllm_ascend/worker/draft_model_runner.py"
156- - "vllm_ascend/patch/worker/patch_common/patch_metrics.py"
157- - "vllm_ascend/patch/worker/patch_common/patch_spec_decode_worker.py"
158- - "vllm_ascend/patch/worker/patch_common/patch_multi_step_worker.py"
159-
160- - name : Run vllm-project/vllm-ascend Speculative Decode test
161- if : steps.filter_spec_decode.outputs.speculative_tests_changed == 'true' || github.event_name == 'schedule'
162- run : |
163- if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
164- VLLM_USE_MODELSCOPE=true pytest -sv tests/singlecard/spec_decode/e2e/test_v1_spec_decode.py
165- pytest -sv tests/singlecard/spec_decode/e2e/test_mtp_correctness.py # it needs a clean process
166- pytest -sv tests/singlecard/spec_decode --ignore=tests/singlecard/spec_decode/e2e/test_mtp_correctness.py --ignore=tests/singlecard/spec_decode/e2e/test_v1_spec_decode.py
137+ pytest -sv tests/multicard/
167138 fi
168139
169140 - name : Run vllm-project/vllm test for V0 Engine
0 commit comments