Skip to content

Commit 7c418cf

Browse files
committed
revert test
Signed-off-by: wangli <wangli858794774@gmail.com>
1 parent 8ecd714 commit 7c418cf

File tree

3 files changed

+131
-0
lines changed

3 files changed

+131
-0
lines changed

benchmarks/tests/latency-tests.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,25 @@
11
[
2+
{
3+
"test_name": "latency_qwen3_8B_tp1",
4+
"parameters": {
5+
"model": "Qwen/Qwen3-8B",
6+
"tensor_parallel_size": 1,
7+
"load_format": "dummy",
8+
"max_model_len": 16384,
9+
"num_iters_warmup": 5,
10+
"num_iters": 15
11+
}
12+
},
13+
{
14+
"test_name": "latency_qwen2_5_7B_tp1",
15+
"parameters": {
16+
"model": "Qwen/Qwen2.5-7B-Instruct",
17+
"tensor_parallel_size": 1,
18+
"load_format": "dummy",
19+
"num_iters_warmup": 5,
20+
"num_iters": 15
21+
}
22+
},
223
{
324
"test_name": "latency_qwen3_30B_A3B_tp4",
425
"parameters": {

benchmarks/tests/serving-tests.json

Lines changed: 75 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,79 @@
11
[
2+
{
3+
"test_name": "serving_qwen2_5vl_7B_tp1",
4+
"qps_list": [
5+
1,
6+
4,
7+
16,
8+
"inf"
9+
],
10+
"server_parameters": {
11+
"model": "Qwen/Qwen2.5-VL-7B-Instruct",
12+
"tensor_parallel_size": 1,
13+
"swap_space": 16,
14+
"disable_log_stats": "",
15+
"disable_log_requests": "",
16+
"trust_remote_code": "",
17+
"max_model_len": 16384
18+
},
19+
"client_parameters": {
20+
"model": "Qwen/Qwen2.5-VL-7B-Instruct",
21+
"endpoint_type": "openai-chat",
22+
"dataset_name": "hf",
23+
"hf_split": "train",
24+
"endpoint": "/v1/chat/completions",
25+
"dataset_path": "lmarena-ai/vision-arena-bench-v0.1",
26+
"num_prompts": 200
27+
}
28+
},
29+
{
30+
"test_name": "serving_qwen3_8B_tp1",
31+
"qps_list": [
32+
1,
33+
4,
34+
16,
35+
"inf"
36+
],
37+
"server_parameters": {
38+
"model": "Qwen/Qwen3-8B",
39+
"tensor_parallel_size": 1,
40+
"swap_space": 16,
41+
"disable_log_stats": "",
42+
"disable_log_requests": "",
43+
"load_format": "dummy"
44+
},
45+
"client_parameters": {
46+
"model": "Qwen/Qwen3-8B",
47+
"endpoint_type": "vllm",
48+
"dataset_name": "sharegpt",
49+
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
50+
"num_prompts": 200
51+
}
52+
},
53+
{
54+
"test_name": "serving_qwen2_5_7B_tp1",
55+
"qps_list": [
56+
1,
57+
4,
58+
16,
59+
"inf"
60+
],
61+
"server_parameters": {
62+
"model": "Qwen/Qwen2.5-7B-Instruct",
63+
"tensor_parallel_size": 1,
64+
"swap_space": 16,
65+
"disable_log_stats": "",
66+
"disable_log_requests": "",
67+
"load_format": "dummy"
68+
},
69+
"client_parameters": {
70+
"model": "Qwen/Qwen2.5-7B-Instruct",
71+
"endpoint_type": "vllm",
72+
"dataset_name": "sharegpt",
73+
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
74+
"num_prompts": 200
75+
}
76+
},
277
{
378
"test_name": "serving_qwen3_30B_A3B_tp1",
479
"qps_list": [

benchmarks/tests/throughput-tests.json

Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,39 @@
11
[
2+
{
3+
"test_name": "throughput_qwen3_8B_tp1",
4+
"parameters": {
5+
"model": "Qwen/Qwen3-8B",
6+
"tensor_parallel_size": 1,
7+
"load_format": "dummy",
8+
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
9+
"num_prompts": 200,
10+
"backend": "vllm"
11+
}
12+
},
13+
{
14+
"test_name": "throughput_qwen2_5vl_7B_tp1",
15+
"parameters": {
16+
"model": "Qwen/Qwen2.5-VL-7B-Instruct",
17+
"tensor_parallel_size": 1,
18+
"backend": "vllm-chat",
19+
"dataset_name": "hf",
20+
"hf_split": "train",
21+
"max_model_len": 16384,
22+
"dataset_path": "lmarena-ai/vision-arena-bench-v0.1",
23+
"num_prompts": 200
24+
}
25+
},
26+
{
27+
"test_name": "throughput_qwen2_5_7B_tp1",
28+
"parameters": {
29+
"model": "Qwen/Qwen2.5-7B-Instruct",
30+
"tensor_parallel_size": 1,
31+
"load_format": "dummy",
32+
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
33+
"num_prompts": 200,
34+
"backend": "vllm"
35+
}
36+
},
237
{
338
"test_name": "throughput_qwen3_30B_A3B_tp1",
439
"parameters": {

0 commit comments

Comments
 (0)