273 lines
6.0 KiB
JSON
273 lines
6.0 KiB
JSON
[
|
|
{
|
|
"name": "single_threaded",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 394.2612773048821,
|
|
"latency_p50": 1.802,
|
|
"latency_p95": 1.84,
|
|
"latency_p99": 1.84,
|
|
"latency_p999": 1.84,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {}
|
|
},
|
|
{
|
|
"name": "multi_threaded_1",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 3590.5525338642337,
|
|
"latency_p50": 2.8725,
|
|
"latency_p95": 4.9171249999999995,
|
|
"latency_p99": 5.915125000000001,
|
|
"latency_p999": 11.257,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"threads": "1"
|
|
}
|
|
},
|
|
{
|
|
"name": "multi_threaded_4",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 3158.700202068685,
|
|
"latency_p50": 2.83425,
|
|
"latency_p95": 5.983750000000001,
|
|
"latency_p99": 9.629083,
|
|
"latency_p999": 13.0975,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"threads": "4"
|
|
}
|
|
},
|
|
{
|
|
"name": "multi_threaded_8",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 3264.1971800718075,
|
|
"latency_p50": 2.799334,
|
|
"latency_p95": 5.170167,
|
|
"latency_p99": 8.281,
|
|
"latency_p999": 10.929542,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"threads": "8"
|
|
}
|
|
},
|
|
{
|
|
"name": "multi_threaded_16",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 3597.266257507607,
|
|
"latency_p50": 2.859084,
|
|
"latency_p95": 5.105084000000001,
|
|
"latency_p99": 8.471042,
|
|
"latency_p999": 14.47975,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"threads": "16"
|
|
}
|
|
},
|
|
{
|
|
"name": "ef_search_50",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 673.8290389990807,
|
|
"latency_p50": 1.346,
|
|
"latency_p95": 1.349,
|
|
"latency_p99": 1.349,
|
|
"latency_p999": 1.349,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"ef_search": "50"
|
|
}
|
|
},
|
|
{
|
|
"name": "ef_search_100",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 596.1576449850057,
|
|
"latency_p50": 1.366,
|
|
"latency_p95": 1.375,
|
|
"latency_p99": 1.375,
|
|
"latency_p999": 1.375,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"ef_search": "100"
|
|
}
|
|
},
|
|
{
|
|
"name": "ef_search_200",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 571.8043285587672,
|
|
"latency_p50": 1.4,
|
|
"latency_p95": 1.411,
|
|
"latency_p99": 1.411,
|
|
"latency_p999": 1.411,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"ef_search": "200"
|
|
}
|
|
},
|
|
{
|
|
"name": "ef_search_400",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 434.02464598101585,
|
|
"latency_p50": 1.965,
|
|
"latency_p95": 1.981,
|
|
"latency_p99": 1.981,
|
|
"latency_p999": 1.981,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"ef_search": "400"
|
|
}
|
|
},
|
|
{
|
|
"name": "ef_search_800",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 434.0612572013698,
|
|
"latency_p50": 1.772,
|
|
"latency_p95": 1.821,
|
|
"latency_p99": 1.821,
|
|
"latency_p999": 1.821,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"ef_search": "800"
|
|
}
|
|
},
|
|
{
|
|
"name": "quantization_none",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 423.8023729012711,
|
|
"latency_p50": 1.7049999999999998,
|
|
"latency_p95": 1.771,
|
|
"latency_p99": 1.771,
|
|
"latency_p999": 1.771,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"quantization": "none"
|
|
}
|
|
},
|
|
{
|
|
"name": "quantization_scalar",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 411.3324982598064,
|
|
"latency_p50": 1.751,
|
|
"latency_p95": 1.824,
|
|
"latency_p99": 1.824,
|
|
"latency_p999": 1.824,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"quantization": "scalar"
|
|
}
|
|
},
|
|
{
|
|
"name": "quantization_binary",
|
|
"dataset": "synthetic",
|
|
"dimensions": 384,
|
|
"num_vectors": 50000,
|
|
"num_queries": 1000,
|
|
"k": 10,
|
|
"qps": 440.33957446794454,
|
|
"latency_p50": 1.7049999999999998,
|
|
"latency_p95": 1.752,
|
|
"latency_p99": 1.752,
|
|
"latency_p999": 1.752,
|
|
"recall_at_1": 1.0,
|
|
"recall_at_10": 1.0,
|
|
"recall_at_100": 1.0,
|
|
"memory_mb": 0.0,
|
|
"build_time_secs": 0.0,
|
|
"metadata": {
|
|
"quantization": "binary"
|
|
}
|
|
}
|
|
] |