Files
wifi-densepose/vendor/ruvector/bench_results/latency_benchmark.json

273 lines
6.0 KiB
JSON

[
{
"name": "single_threaded",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 394.2612773048821,
"latency_p50": 1.802,
"latency_p95": 1.84,
"latency_p99": 1.84,
"latency_p999": 1.84,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {}
},
{
"name": "multi_threaded_1",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 3590.5525338642337,
"latency_p50": 2.8725,
"latency_p95": 4.9171249999999995,
"latency_p99": 5.915125000000001,
"latency_p999": 11.257,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"threads": "1"
}
},
{
"name": "multi_threaded_4",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 3158.700202068685,
"latency_p50": 2.83425,
"latency_p95": 5.983750000000001,
"latency_p99": 9.629083,
"latency_p999": 13.0975,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"threads": "4"
}
},
{
"name": "multi_threaded_8",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 3264.1971800718075,
"latency_p50": 2.799334,
"latency_p95": 5.170167,
"latency_p99": 8.281,
"latency_p999": 10.929542,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"threads": "8"
}
},
{
"name": "multi_threaded_16",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 3597.266257507607,
"latency_p50": 2.859084,
"latency_p95": 5.105084000000001,
"latency_p99": 8.471042,
"latency_p999": 14.47975,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"threads": "16"
}
},
{
"name": "ef_search_50",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 673.8290389990807,
"latency_p50": 1.346,
"latency_p95": 1.349,
"latency_p99": 1.349,
"latency_p999": 1.349,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"ef_search": "50"
}
},
{
"name": "ef_search_100",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 596.1576449850057,
"latency_p50": 1.366,
"latency_p95": 1.375,
"latency_p99": 1.375,
"latency_p999": 1.375,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"ef_search": "100"
}
},
{
"name": "ef_search_200",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 571.8043285587672,
"latency_p50": 1.4,
"latency_p95": 1.411,
"latency_p99": 1.411,
"latency_p999": 1.411,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"ef_search": "200"
}
},
{
"name": "ef_search_400",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 434.02464598101585,
"latency_p50": 1.965,
"latency_p95": 1.981,
"latency_p99": 1.981,
"latency_p999": 1.981,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"ef_search": "400"
}
},
{
"name": "ef_search_800",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 434.0612572013698,
"latency_p50": 1.772,
"latency_p95": 1.821,
"latency_p99": 1.821,
"latency_p999": 1.821,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"ef_search": "800"
}
},
{
"name": "quantization_none",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 423.8023729012711,
"latency_p50": 1.7049999999999998,
"latency_p95": 1.771,
"latency_p99": 1.771,
"latency_p999": 1.771,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"quantization": "none"
}
},
{
"name": "quantization_scalar",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 411.3324982598064,
"latency_p50": 1.751,
"latency_p95": 1.824,
"latency_p99": 1.824,
"latency_p999": 1.824,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"quantization": "scalar"
}
},
{
"name": "quantization_binary",
"dataset": "synthetic",
"dimensions": 384,
"num_vectors": 50000,
"num_queries": 1000,
"k": 10,
"qps": 440.33957446794454,
"latency_p50": 1.7049999999999998,
"latency_p95": 1.752,
"latency_p99": 1.752,
"latency_p999": 1.752,
"recall_at_1": 1.0,
"recall_at_10": 1.0,
"recall_at_100": 1.0,
"memory_mb": 0.0,
"build_time_secs": 0.0,
"metadata": {
"quantization": "binary"
}
}
]