Skip to content

Commit c922df1

Browse files
committed
test new nodel
Signed-off-by: wangli <wangli858794774@gmail.com>
1 parent 892e873 commit c922df1

File tree

3 files changed

+0
-131
lines changed

3 files changed

+0
-131
lines changed

benchmarks/tests/latency-tests.json

Lines changed: 0 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -1,25 +1,4 @@
1 1
[
2-
{
3-
"test_name": "latency_qwen3_8B_tp1",
4-
"parameters": {
5-
"model": "Qwen/Qwen3-8B",
6-
"tensor_parallel_size": 1,
7-
"load_format": "dummy",
8-
"max_model_len": 16384,
9-
"num_iters_warmup": 5,
10-
"num_iters": 15
11-
}
12-
},
13-
{
14-
"test_name": "latency_qwen2_5_7B_tp1",
15-
"parameters": {
16-
"model": "Qwen/Qwen2.5-7B-Instruct",
17-
"tensor_parallel_size": 1,
18-
"load_format": "dummy",
19-
"num_iters_warmup": 5,
20-
"num_iters": 15
21-
}
22-
},
23 2
{
24 3
"test_name": "latency_qwen3_30B_A3B_tp4",
25 4
"parameters": {

benchmarks/tests/serving-tests.json

Lines changed: 0 additions & 75 deletions
Original file line numberDiff line numberDiff line change
@@ -1,79 +1,4 @@
1 1
[
2-
{
3-
"test_name": "serving_qwen2_5vl_7B_tp1",
4-
"qps_list": [
5-
1,
6-
4,
7-
16,
8-
"inf"
9-
],
10-
"server_parameters": {
11-
"model": "Qwen/Qwen2.5-VL-7B-Instruct",
12-
"tensor_parallel_size": 1,
13-
"swap_space": 16,
14-
"disable_log_stats": "",
15-
"disable_log_requests": "",
16-
"trust_remote_code": "",
17-
"max_model_len": 16384
18-
},
19-
"client_parameters": {
20-
"model": "Qwen/Qwen2.5-VL-7B-Instruct",
21-
"endpoint_type": "openai-chat",
22-
"dataset_name": "hf",
23-
"hf_split": "train",
24-
"endpoint": "/v1/chat/completions",
25-
"dataset_path": "lmarena-ai/vision-arena-bench-v0.1",
26-
"num_prompts": 200
27-
}
28-
},
29-
{
30-
"test_name": "serving_qwen3_8B_tp1",
31-
"qps_list": [
32-
1,
33-
4,
34-
16,
35-
"inf"
36-
],
37-
"server_parameters": {
38-
"model": "Qwen/Qwen3-8B",
39-
"tensor_parallel_size": 1,
40-
"swap_space": 16,
41-
"disable_log_stats": "",
42-
"disable_log_requests": "",
43-
"load_format": "dummy"
44-
},
45-
"client_parameters": {
46-
"model": "Qwen/Qwen3-8B",
47-
"endpoint_type": "vllm",
48-
"dataset_name": "sharegpt",
49-
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
50-
"num_prompts": 200
51-
}
52-
},
53-
{
54-
"test_name": "serving_qwen2_5_7B_tp1",
55-
"qps_list": [
56-
1,
57-
4,
58-
16,
59-
"inf"
60-
],
61-
"server_parameters": {
62-
"model": "Qwen/Qwen2.5-7B-Instruct",
63-
"tensor_parallel_size": 1,
64-
"swap_space": 16,
65-
"disable_log_stats": "",
66-
"disable_log_requests": "",
67-
"load_format": "dummy"
68-
},
69-
"client_parameters": {
70-
"model": "Qwen/Qwen2.5-7B-Instruct",
71-
"endpoint_type": "vllm",
72-
"dataset_name": "sharegpt",
73-
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
74-
"num_prompts": 200
75-
}
76-
},
77 2
{
78 3
"test_name": "serving_qwen3_30B_A3B_tp1",
79 4
"qps_list": [

benchmarks/tests/throughput-tests.json

Lines changed: 0 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -1,39 +1,4 @@
1 1
[
2-
{
3-
"test_name": "throughput_qwen3_8B_tp1",
4-
"parameters": {
5-
"model": "Qwen/Qwen3-8B",
6-
"tensor_parallel_size": 1,
7-
"load_format": "dummy",
8-
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
9-
"num_prompts": 200,
10-
"backend": "vllm"
11-
}
12-
},
13-
{
14-
"test_name": "throughput_qwen2_5vl_7B_tp1",
15-
"parameters": {
16-
"model": "Qwen/Qwen2.5-VL-7B-Instruct",
17-
"tensor_parallel_size": 1,
18-
"backend": "vllm-chat",
19-
"dataset_name": "hf",
20-
"hf_split": "train",
21-
"max_model_len": 16384,
22-
"dataset_path": "lmarena-ai/vision-arena-bench-v0.1",
23-
"num_prompts": 200
24-
}
25-
},
26-
{
27-
"test_name": "throughput_qwen2_5_7B_tp1",
28-
"parameters": {
29-
"model": "Qwen/Qwen2.5-7B-Instruct",
30-
"tensor_parallel_size": 1,
31-
"load_format": "dummy",
32-
"dataset_path": "/github/home/.cache/datasets/ShareGPT_V3_unfiltered_cleaned_split.json",
33-
"num_prompts": 200,
34-
"backend": "vllm"
35-
}
36-
},
37 2
{
38 3
"test_name": "throughput_qwen3_30B_A3B_tp1",
39 4
"parameters": {

0 commit comments

Comments
 (0)