Skip to content

Commit 539b9fd

Browse files
committed
add gemma-3-27b-it and qwen3_30B-A3B
1 parent 319ad22 commit 539b9fd

File tree

1 file changed

+120
-0
lines changed

1 file changed

+120
-0
lines changed

vllm-benchmarks/benchmarks/serving-tests.json

Lines changed: 120 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -117,5 +117,125 @@
117117
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
118118
"num_prompts": 200
119119
}
120+
},
121+
{
122+
"test_name": "serving_qwen3_30B-A3B_tp8_in200_out200",
123+
"qps_list": ["inf"],
124+
"server_parameters": {
125+
"model": "Qwen/Qwen3-30B-A3B",
126+
"tensor_parallel_size": 8,
127+
"swap_space": 16,
128+
"disable_log_stats": "",
129+
"disable_log_requests": "",
130+
"load_format": "dummy",
131+
"max_model_len": 8192
132+
},
133+
"client_parameters": {
134+
"model": "Qwen/Qwen3-30B-A3B",
135+
"backend": "vllm",
136+
"dataset_name": "random",
137+
"random_input_len": 200,
138+
"random_output_len": 200
139+
}
140+
},
141+
{
142+
"test_name": "serving_qwen3_30B-A3B_tp8_in1k_out2k",
143+
"qps_list": ["inf"],
144+
"server_parameters": {
145+
"model": "Qwen/Qwen3-30B-A3B",
146+
"tensor_parallel_size": 8,
147+
"swap_space": 16,
148+
"disable_log_stats": "",
149+
"disable_log_requests": "",
150+
"load_format": "dummy",
151+
"max_model_len": 8192
152+
},
153+
"client_parameters": {
154+
"model": "Qwen/Qwen3-30B-A3B",
155+
"backend": "vllm",
156+
"dataset_name": "random",
157+
"random_input_len": 1024,
158+
"random_output_len": 2048
159+
}
160+
},
161+
{
162+
"test_name": "serving_qwen3_30B-A3B_tp8_in5k_out1k",
163+
"qps_list": ["inf"],
164+
"server_parameters": {
165+
"model": "Qwen/Qwen3-30B-A3B",
166+
"tensor_parallel_size": 8,
167+
"swap_space": 16,
168+
"disable_log_stats": "",
169+
"disable_log_requests": "",
170+
"load_format": "dummy",
171+
"max_model_len": 8192
172+
},
173+
"client_parameters": {
174+
"model": "Qwen/Qwen3-30B-A3B",
175+
"backend": "vllm",
176+
"dataset_name": "random",
177+
"random_input_len": 5120,
178+
"random_output_len": 1024
179+
}
180+
},
181+
{
182+
"test_name": "serving_gemma_3_27b_it_tp8_in200_out200",
183+
"qps_list": ["inf"],
184+
"server_parameters": {
185+
"model": "google/gemma-3-27b-it",
186+
"tensor_parallel_size": 8,
187+
"swap_space": 16,
188+
"disable_log_stats": "",
189+
"disable_log_requests": "",
190+
"load_format": "dummy",
191+
"max_model_len": 8192
192+
},
193+
"client_parameters": {
194+
"model": "google/gemma-3-27b-it",
195+
"backend": "vllm",
196+
"dataset_name": "random",
197+
"random_input_len": 200,
198+
"random_output_len": 200
199+
}
200+
},
201+
{
202+
"test_name": "serving_gemma_3_27b_it_tp8_in1k_out2k",
203+
"qps_list": ["inf"],
204+
"server_parameters": {
205+
"model": "google/gemma-3-27b-it",
206+
"tensor_parallel_size": 8,
207+
"swap_space": 16,
208+
"disable_log_stats": "",
209+
"disable_log_requests": "",
210+
"load_format": "dummy",
211+
"max_model_len": 8192
212+
},
213+
"client_parameters": {
214+
"model": "google/gemma-3-27b-it",
215+
"backend": "vllm",
216+
"dataset_name": "random",
217+
"random_input_len": 1024,
218+
"random_output_len": 2048
219+
}
220+
},
221+
{
222+
"test_name": "serving_gemma_3_27b_it_tp8_in5k_out1k",
223+
"qps_list": ["inf"],
224+
"server_parameters": {
225+
"model": "google/gemma-3-27b-it",
226+
"tensor_parallel_size": 8,
227+
"swap_space": 16,
228+
"disable_log_stats": "",
229+
"disable_log_requests": "",
230+
"load_format": "dummy",
231+
"max_model_len": 8192
232+
},
233+
"client_parameters": {
234+
"model": "google/gemma-3-27b-it",
235+
"backend": "vllm",
236+
"dataset_name": "random",
237+
"random_input_len": 5120,
238+
"random_output_len": 1024
239+
}
120240
}
121241
]

0 commit comments

Comments
 (0)