[ { "name": "single_threaded", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 394.2612773048821, "latency_p50": 1.802, "latency_p95": 1.84, "latency_p99": 1.84, "latency_p999": 1.84, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": {} }, { "name": "multi_threaded_1", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 3590.5525338642337, "latency_p50": 2.8725, "latency_p95": 4.9171249999999995, "latency_p99": 5.915125000000001, "latency_p999": 11.257, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "threads": "1" } }, { "name": "multi_threaded_4", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 3158.700202068685, "latency_p50": 2.83425, "latency_p95": 5.983750000000001, "latency_p99": 9.629083, "latency_p999": 13.0975, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "threads": "4" } }, { "name": "multi_threaded_8", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 3264.1971800718075, "latency_p50": 2.799334, "latency_p95": 5.170167, "latency_p99": 8.281, "latency_p999": 10.929542, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "threads": "8" } }, { "name": "multi_threaded_16", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 3597.266257507607, "latency_p50": 2.859084, "latency_p95": 5.105084000000001, "latency_p99": 8.471042, "latency_p999": 14.47975, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "threads": "16" } }, { "name": "ef_search_50", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 673.8290389990807, "latency_p50": 1.346, "latency_p95": 1.349, "latency_p99": 1.349, "latency_p999": 1.349, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "ef_search": "50" } }, { "name": "ef_search_100", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 596.1576449850057, "latency_p50": 1.366, "latency_p95": 1.375, "latency_p99": 1.375, "latency_p999": 1.375, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "ef_search": "100" } }, { "name": "ef_search_200", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 571.8043285587672, "latency_p50": 1.4, "latency_p95": 1.411, "latency_p99": 1.411, "latency_p999": 1.411, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "ef_search": "200" } }, { "name": "ef_search_400", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 434.02464598101585, "latency_p50": 1.965, "latency_p95": 1.981, "latency_p99": 1.981, "latency_p999": 1.981, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "ef_search": "400" } }, { "name": "ef_search_800", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 434.0612572013698, "latency_p50": 1.772, "latency_p95": 1.821, "latency_p99": 1.821, "latency_p999": 1.821, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "ef_search": "800" } }, { "name": "quantization_none", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 423.8023729012711, "latency_p50": 1.7049999999999998, "latency_p95": 1.771, "latency_p99": 1.771, "latency_p999": 1.771, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "quantization": "none" } }, { "name": "quantization_scalar", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 411.3324982598064, "latency_p50": 1.751, "latency_p95": 1.824, "latency_p99": 1.824, "latency_p999": 1.824, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "quantization": "scalar" } }, { "name": "quantization_binary", "dataset": "synthetic", "dimensions": 384, "num_vectors": 50000, "num_queries": 1000, "k": 10, "qps": 440.33957446794454, "latency_p50": 1.7049999999999998, "latency_p95": 1.752, "latency_p99": 1.752, "latency_p999": 1.752, "recall_at_1": 1.0, "recall_at_10": 1.0, "recall_at_100": 1.0, "memory_mb": 0.0, "build_time_secs": 0.0, "metadata": { "quantization": "binary" } } ]