Skip to content

Commit 1bbd404

Browse files
alwayslove2013 authored and XuanYang-cn committed
update leaderboard data: use 90p search stage results as streaming performance
Signed-off-by: min.tian <min.tian.cn@gmail.com>
1 parent 3c42ffe commit 1bbd404

2 files changed

Lines changed: 33 additions & 71 deletions

File tree

vectordb_bench/results/getLeaderboardDataV2.py

Lines changed: 5 additions & 15 deletions
Original file line number | Diff line number | Diff line change
@@ -57,17 +57,9 @@ def main():
5757
)
5858
else:
5959
case: StreamingPerformanceCase = case
60-
# only use streaming-results (reading while inserting), exclude streaming-final or streaming-optimized results.
61-
qps_list = [
62-
qps
63-
for i, qps in enumerate(case_result.metrics.st_max_qps_list_list)
64-
if case_result.metrics.st_search_stage_list[i] < 100
65-
]
66-
latency_list = [
67-
latency
68-
for i, latency in enumerate(case_result.metrics.st_serial_latency_p99_list)
69-
if case_result.metrics.st_search_stage_list[i] < 100
70-
]
60+
# use 90p search stage results to represent streaming performance
61+
qps_90p = metrics.st_max_qps_list_list[metrics.st_search_stage_list.index(90)]
62+
latency_90p = metrics.st_serial_latency_p99_list[metrics.st_search_stage_list.index(90)]
7163
insert_rate = case.insert_rate
7264
streaming_data.append(
7365
{
@@ -76,10 +68,8 @@ def main():
7668
"label": label,
7769
"db_name": db_name,
7870
"insert_rate": insert_rate,
79-
"qps_avg": round(np.mean(qps_list), 4),
80-
"qps_std": round(np.std(qps_list), 4),
81-
"latency_avg": round(np.mean(latency_list), 4),
82-
"latency_std": round(np.std(latency_list), 4),
71+
"streaming_qps": round(qps_90p, 4),
72+
"streaming_latency": round(latency_90p, 4),
8373
}
8474
)
8575
save_to_json(data, config.RESULTS_LOCAL_DIR / "leaderboard_v2.json")

vectordb_bench/results/leaderboard_v2_streaming.json

Lines changed: 28 additions & 56 deletions
Original file line number | Diff line number | Diff line change
@@ -5,152 +5,124 @@
55
"label": "8c60g",
66
"db_name": "ElasticCloud-8c60g",
77
"insert_rate": 500,
8-
"qps_avg": 73.0943,
9-
"qps_std": 11.9516,
10-
"latency_avg": 0.0741,
11-
"latency_std": 0.0254
8+
"streaming_qps": 61.6708,
9+
"streaming_latency": 0.0794
1210
},
1311
{
1412
"dataset": "Cohere (Large)",
1513
"db": "ElasticCloud",
1614
"label": "8c60g",
1715
"db_name": "ElasticCloud-8c60g",
1816
"insert_rate": 1000,
19-
"qps_avg": 65.0504,
20-
"qps_std": 7.1721,
21-
"latency_avg": 0.1216,
22-
"latency_std": 0.0886
17+
"streaming_qps": 61.8172,
18+
"streaming_latency": 0.2223
2319
},
2420
{
2521
"dataset": "Cohere (Large)",
2622
"db": "Milvus",
2723
"label": "16c64g-sq8",
2824
"db_name": "Milvus-16c64g-sq8",
2925
"insert_rate": 500,
30-
"qps_avg": 551.4718,
31-
"qps_std": 224.6286,
32-
"latency_avg": 0.0069,
33-
"latency_std": 0.0022
26+
"streaming_qps": 305.9971,
27+
"streaming_latency": 0.005
3428
},
3529
{
3630
"dataset": "Cohere (Large)",
3731
"db": "Milvus",
3832
"label": "16c64g-sq8",
3933
"db_name": "Milvus-16c64g-sq8",
4034
"insert_rate": 1000,
41-
"qps_avg": 308.8962,
42-
"qps_std": 138.3864,
43-
"latency_avg": 0.0155,
44-
"latency_std": 0.0104
35+
"streaming_qps": 155.9613,
36+
"streaming_latency": 0.0203
4537
},
4638
{
4739
"dataset": "Cohere (Large)",
4840
"db": "Pinecone",
4941
"label": "p2.x8-1node",
5042
"db_name": "Pinecone-p2.x8-1node",
5143
"insert_rate": 500,
52-
"qps_avg": 378.1992,
53-
"qps_std": 14.4105,
54-
"latency_avg": 0.8718,
55-
"latency_std": 0.6552
44+
"streaming_qps": 367.4299,
45+
"streaming_latency": 1.8286
5646
},
5747
{
5848
"dataset": "Cohere (Large)",
5949
"db": "Pinecone",
6050
"label": "p2.x8-1node",
6151
"db_name": "Pinecone-p2.x8-1node",
6252
"insert_rate": 1000,
63-
"qps_avg": 381.9444,
64-
"qps_std": 22.3178,
65-
"latency_avg": 3.3114,
66-
"latency_std": 1.9718
53+
"streaming_qps": 369.6771,
54+
"streaming_latency": 5.992
6755
},
6856
{
6957
"dataset": "Cohere (Large)",
7058
"db": "QdrantCloud",
7159
"label": "16c64g",
7260
"db_name": "QdrantCloud-16c64g",
7361
"insert_rate": 500,
74-
"qps_avg": 622.5787,
75-
"qps_std": 174.3233,
76-
"latency_avg": 0.0097,
77-
"latency_std": 0.0025
62+
"streaming_qps": 393.753,
63+
"streaming_latency": 0.0162
7864
},
7965
{
8066
"dataset": "Cohere (Large)",
8167
"db": "QdrantCloud",
8268
"label": "16c64g",
8369
"db_name": "QdrantCloud-16c64g",
8470
"insert_rate": 1000,
85-
"qps_avg": 506.718,
86-
"qps_std": 125.8131,
87-
"latency_avg": 0.0116,
88-
"latency_std": 0.0012
71+
"streaming_qps": 347.5774,
72+
"streaming_latency": 0.0118
8973
},
9074
{
9175
"dataset": "Cohere (Large)",
9276
"db": "OpenSearch",
9377
"label": "16c128g",
9478
"db_name": "OpenSearch-16c128g",
9579
"insert_rate": 1000,
96-
"qps_avg": 181.1849,
97-
"qps_std": 33.7733,
98-
"latency_avg": 0.0698,
99-
"latency_std": 0.0188
80+
"streaming_qps": 149.7168,
81+
"streaming_latency": 0.098
10082
},
10183
{
10284
"dataset": "Cohere (Large)",
10385
"db": "OpenSearch",
10486
"label": "16c128g",
10587
"db_name": "OpenSearch-16c128g",
10688
"insert_rate": 500,
107-
"qps_avg": 216.7565,
108-
"qps_std": 45.1945,
109-
"latency_avg": 0.0476,
110-
"latency_std": 0.0119
89+
"streaming_qps": 161.6694,
90+
"streaming_latency": 0.052
11191
},
11292
{
11393
"dataset": "Cohere (Large)",
11494
"db": "ZillizCloud",
11595
"label": "8cu-perf",
11696
"db_name": "ZillizCloud-8cu-perf",
11797
"insert_rate": 500,
118-
"qps_avg": 2692.8245,
119-
"qps_std": 396.4151,
120-
"latency_avg": 0.0049,
121-
"latency_std": 0.0013
98+
"streaming_qps": 2118.7516,
99+
"streaming_latency": 0.0068
122100
},
123101
{
124102
"dataset": "Cohere (Large)",
125103
"db": "ZillizCloud",
126104
"label": "8cu-perf",
127105
"db_name": "ZillizCloud-8cu-perf",
128106
"insert_rate": 1000,
129-
"qps_avg": 2166.0034,
130-
"qps_std": 318.8514,
131-
"latency_avg": 0.0124,
132-
"latency_std": 0.0095
107+
"streaming_qps": 1860.2575,
108+
"streaming_latency": 0.0101
133109
},
134110
{
135111
"dataset": "Cohere (Large)",
136112
"db": "S3Vectors",
137113
"label": "",
138114
"db_name": "S3Vectors",
139115
"insert_rate": 500,
140-
"qps_avg": 192.4737,
141-
"qps_std": 5.2065,
142-
"latency_avg": 0.4781,
143-
"latency_std": 0.1369
116+
"streaming_qps": 180.9549,
117+
"streaming_latency": 0.4204
144118
},
145119
{
146120
"dataset": "Cohere (Large)",
147121
"db": "S3Vectors",
148122
"label": "",
149123
"db_name": "S3Vectors",
150124
"insert_rate": 1000,
151-
"qps_avg": 188.4833,
152-
"qps_std": 8.091,
153-
"latency_avg": 0.4486,
154-
"latency_std": 0.0365
125+
"streaming_qps": 167.2689,
126+
"streaming_latency": 0.5048
155127
}
156128
]

0 commit comments

Comments
 (0)