@@ -51,11 +51,11 @@ jobs:
51
51
vllm_verison : [main, v0.8.5.post1]
52
52
concurrency :
53
53
group : >
54
- ${{
55
- matrix.os == 'linux-arm64-npu-4'
56
- && github.event.pull_request.number
57
- && format('pr-{0}-limit-npu-4', github.event.pull_request.number)
58
- || format('job-{0}-{1}-{2}', matrix.os, matrix.vllm_verison, github.event.pull_request.number)
54
+ ${{
55
+ matrix.os == 'linux-arm64-npu-4'
56
+ && github.event.pull_request.number
57
+ && format('pr-{0}-limit-npu-4', github.event.pull_request.number)
58
+ || format('job-{0}-{1}-{2}', matrix.os, matrix.vllm_verison, github.event.pull_request.number)
59
59
}}
60
60
cancel-in-progress : false
61
61
name : vLLM Ascend test
@@ -157,8 +157,9 @@ jobs:
157
157
if : steps.filter_spec_decode.outputs.speculative_tests_changed == 'true' || github.event_name == 'schedule'
158
158
run : |
159
159
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
160
+ VLLM_USE_MODELSCOPE=true pytest -sv tests/singlecard/spec_decode/e2e/test_v1_spec_decode.py
160
161
pytest -sv tests/singlecard/spec_decode/e2e/test_mtp_correctness.py # it needs a clean process
161
- pytest -sv tests/singlecard/spec_decode --ignore=tests/singlecard/spec_decode/e2e/test_mtp_correctness.py
162
+ pytest -sv tests/singlecard/spec_decode --ignore=tests/singlecard/spec_decode/e2e/test_mtp_correctness.py --ignore=tests/singlecard/spec_decode/e2e/test_v1_spec_decode.py
162
163
fi
163
164
164
165
- name : Run vllm-project/vllm test for V0 Engine
0 commit comments