53
53
type : choice
54
54
options :
55
55
- all
56
- - Qwen/Qwen2.5-7B-Instruct
57
56
- Qwen/Qwen2.5-VL-7B-Instruct
58
57
- Qwen/Qwen3-8B-Base
58
+ - Qwen/Qwen3-30B-A3B
59
59
default : ' all'
60
60
61
61
# Bash shells do not use ~/.profile or ~/.bashrc so these shells need to be explicitly
@@ -77,48 +77,48 @@ jobs:
77
77
${{
78
78
(contains(github.event.pull_request.labels.*.name, 'accuracy-test') ||
79
79
contains(github.event.pull_request.labels.*.name, 'vl-accuracy-test') ||
80
+ contains(github.event.pull_request.labels.*.name, 'moe-accuracy-test') ||
80
81
contains(github.event.pull_request.labels.*.name, 'dense-accuracy-test')) &&
81
82
contains(github.event.pull_request.labels.*.name, 'ready-for-test') ||
82
83
github.event_name == 'workflow_dispatch' || github.event_name == 'schedule'
83
84
}}
84
85
runs-on : >-
85
86
${{
86
- (matrix.model_name == 'Qwen/Qwen2.5-VL-7B-Instruct ' && 'linux-arm64-npu-4') ||
87
+ (matrix.model_name == 'Qwen/Qwen3-30B-A3B ' && 'linux-arm64-npu-4') ||
87
88
'linux-arm64-npu-2'
88
89
}}
89
90
strategy :
90
91
matrix :
91
- vllm_use_version : [0, 1]
92
+ vllm_use_version : [1]
92
93
# the accuracy test will run:
93
94
# 1. workflow_dispatch with models input
94
- # - all: Qwen/Qwen2.5-7B-Instruct , Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-8B-Base
95
- # - specified but not all: Qwen/Qwen2.5-7B-Instruct , Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-8B-Base
95
+ # - all: Qwen/Qwen3-30B-A3B, Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-8B-Base
96
+ # - specified but not all: Qwen/Qwen3-30B-A3B, Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-8B-Base
96
97
# 2. PR labeled with "*-accuracy-test"
97
- # - accuracy-test: Qwen/Qwen2.5-7B-Instruct , Qwen/Qwen2.5-VL-7B-Instruct
98
- # - dense-accuracy-test: Qwen/Qwen2.5-7B-Instruct
98
+ # - accuracy-test: Qwen/Qwen3-8B-Base, Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-30B-A3B
99
+ # - dense-accuracy-test: Qwen/Qwen3-8B-Base
99
100
# - vl-accuracy-test: Qwen/Qwen2.5-VL-7B-Instruct
101
+ # - moe-accuracy-test: Qwen/Qwen3-30B-A3B
100
102
model_name : ${{ fromJSON(
101
103
(github.event_name == 'schedule' &&
102
- ' ["Qwen/Qwen2.5-7B-Instruct ","Qwen/Qwen2.5-VL-7B-Instruct","Qwen/Qwen3-8B-Base"]' ) ||
104
+ ' ["Qwen/Qwen3-30B-A3B ","Qwen/Qwen2.5-VL-7B-Instruct","Qwen/Qwen3-8B-Base"]' ) ||
103
105
(github.event.inputs.models == 'all' &&
104
- ' ["Qwen/Qwen2.5-7B-Instruct ","Qwen/Qwen2.5-VL-7B-Instruct","Qwen/Qwen3-8B-Base"]' ) ||
105
- (github.event.inputs.models == 'Qwen/Qwen2.5-7B-Instruct ' &&
106
- ' ["Qwen/Qwen2.5-7B-Instruct "]' ) ||
106
+ ' ["Qwen/Qwen3-30B-A3B ","Qwen/Qwen2.5-VL-7B-Instruct","Qwen/Qwen3-8B-Base"]' ) ||
107
+ (github.event.inputs.models == 'Qwen/Qwen3-30B-A3B ' &&
108
+ ' ["Qwen/Qwen3-30B-A3B "]' ) ||
107
109
(github.event.inputs.models == 'Qwen/Qwen2.5-VL-7B-Instruct' &&
108
110
' ["Qwen/Qwen2.5-VL-7B-Instruct"]' ) ||
109
111
(github.event.inputs.models == 'Qwen/Qwen3-8B-Base' &&
110
112
' ["Qwen/Qwen3-8B-Base"]' ) ||
111
113
contains(github.event.pull_request.labels.*.name, 'accuracy-test') &&
112
- ' ["Qwen/Qwen3-8B-Base","Qwen/Qwen2.5-VL-7B-Instruct"]' ||
114
+ ' ["Qwen/Qwen3-8B-Base","Qwen/Qwen2.5-VL-7B-Instruct", "Qwen/Qwen3-30B-A3B" ]' ||
113
115
contains(github.event.pull_request.labels.*.name, 'dense-accuracy-test') &&
114
116
' ["Qwen/Qwen3-8B-Base"]' ||
115
117
contains(github.event.pull_request.labels.*.name, 'vl-accuracy-test') &&
116
- ' ["Qwen/Qwen2.5-VL-7B-Instruct"]'
118
+ ' ["Qwen/Qwen2.5-VL-7B-Instruct"]' ||
119
+ contains(github.event.pull_request.labels.*.name, 'moe-accuracy-test') &&
120
+ ' ["Qwen/Qwen3-30B-A3B"]'
117
121
) }}
118
- # Remove exclude after https://github.com/vllm-project/vllm-ascend/issues/1044 resolved
119
- exclude :
120
- - model_name : Qwen/Qwen2.5-VL-7B-Instruct
121
- vllm_use_version : 1
122
122
123
123
fail-fast : false
124
124
name : ${{ matrix.model_name }} accuracy V${{ matrix.vllm_use_version }}
@@ -187,23 +187,19 @@ jobs:
187
187
- name : Get vLLM commit hash and URL
188
188
working-directory : ./vllm-empty
189
189
run : |
190
- VLLM_COMMIT=$(git rev-parse HEAD)
190
+ VLLM_COMMIT=$(git rev-parse --short=7 HEAD)
191
191
echo "VLLM_COMMIT=$VLLM_COMMIT" >> $GITHUB_ENV
192
- echo "VLLM_COMMIT_URL=https://github.com/vllm-project/vllm/commit/$VLLM_COMMIT" >> $GITHUB_ENV
193
192
194
193
- name : Get vLLM-Ascend commit hash and URL
195
194
working-directory : ./vllm-ascend
196
195
run : |
197
- VLLM_ASCEND_COMMIT=$(git rev-parse HEAD)
196
+ VLLM_ASCEND_COMMIT=$(git rev-parse --short=7 HEAD)
198
197
echo "VLLM_ASCEND_COMMIT=$VLLM_ASCEND_COMMIT" >> $GITHUB_ENV
199
- echo "VLLM_ASCEND_COMMIT_URL=https://github.com/vllm-project/vllm-ascend/commit/$VLLM_ASCEND_COMMIT" >> $GITHUB_ENV
200
198
201
- - name : Print resolved hashes and URLs
199
+ - name : Print resolved hashes
202
200
run : |
203
201
echo "vLLM : ${{ env.VLLM_COMMIT }}"
204
- echo "vLLM link : ${{ env.VLLM_COMMIT_URL }}"
205
202
echo "vLLM-Ascend: ${{ env.VLLM_ASCEND_COMMIT }}"
206
- echo "Ascend link: ${{ env.VLLM_ASCEND_COMMIT_URL }}"
207
203
208
204
- name : Install lm-eval, ray, and datasets
209
205
run : |
@@ -262,8 +258,6 @@ jobs:
262
258
--vllm_version "${{ env.GHA_VLLM_VERSION }}" \
263
259
--vllm_commit "${{ env.VLLM_COMMIT }}" \
264
260
--vllm_ascend_commit "${{ env.VLLM_ASCEND_COMMIT }}" \
265
- --vllm_commit_url "${{ env.VLLM_COMMIT_URL }}" \
266
- --vllm_ascend_commit_url "${{ env.VLLM_ASCEND_COMMIT_URL }}" \
267
261
--vllm_use_v1 "$VLLM_USE_V1"
268
262
269
263
- name : Generate step summary
@@ -385,7 +379,7 @@ jobs:
385
379
body: `The accuracy results running on NPU Atlas A2 have changed, updating reports for:
386
380
${{
387
381
github.event.inputs.models == 'all'
388
- && 'All models (Qwen2.5-7B-Instruct , Qwen2.5-VL-7B-Instruct, Qwen3-8B-Base)'
382
+ && 'All models (Qwen/Qwen3-30B-A3B , Qwen2.5-VL-7B-Instruct, Qwen3-8B-Base)'
389
383
|| github.event.inputs.models
390
384
}}
391
385
0 commit comments