git-subtree-dir: vendor/ruvector git-subtree-split: b64c21726f2bb37286d9ee36a7869fef60cc6900
216 lines
5.7 KiB
JSON
216 lines
5.7 KiB
JSON
{
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"results": [
|
|
{
|
|
"efficiency_percent": 0.9881420625225114,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 50,
|
|
"max_time_ms": 3.174368,
|
|
"mean_time_ms": 0.16471358,
|
|
"metadata": {
|
|
"bandwidth_gb_s": "5.93",
|
|
"size_mb": "1"
|
|
},
|
|
"min_time_ms": 0.040596,
|
|
"name": "memory_bandwidth_1MB",
|
|
"operation": "memory_transfer",
|
|
"std_time_ms": 0.5062852803394976,
|
|
"throughput": 5.928852375135068
|
|
},
|
|
{
|
|
"efficiency_percent": 0.713928028478,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 50,
|
|
"max_time_ms": 17.299856,
|
|
"mean_time_ms": 2.2797874599999997,
|
|
"metadata": {
|
|
"bandwidth_gb_s": "4.28",
|
|
"size_mb": "10"
|
|
},
|
|
"min_time_ms": 0.37521899999999997,
|
|
"name": "memory_bandwidth_10MB",
|
|
"operation": "memory_transfer",
|
|
"std_time_ms": 3.4558740220220883,
|
|
"throughput": 4.283568170868
|
|
},
|
|
{
|
|
"efficiency_percent": 0.08924861363335496,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 50,
|
|
"max_time_ms": 330.599246,
|
|
"mean_time_ms": 182.36744532,
|
|
"metadata": {
|
|
"bandwidth_gb_s": "0.54",
|
|
"size_mb": "100"
|
|
},
|
|
"min_time_ms": 104.69545500000001,
|
|
"name": "memory_bandwidth_100MB",
|
|
"operation": "memory_transfer",
|
|
"std_time_ms": 55.7021010042311,
|
|
"throughput": 0.5354916818001297
|
|
},
|
|
{
|
|
"efficiency_percent": 0.1439795903913544,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 50,
|
|
"max_time_ms": 1279.9928280000001,
|
|
"mean_time_ms": 565.2204462599999,
|
|
"metadata": {
|
|
"bandwidth_gb_s": "0.86",
|
|
"size_mb": "500"
|
|
},
|
|
"min_time_ms": 199.191355,
|
|
"name": "memory_bandwidth_500MB",
|
|
"operation": "memory_transfer",
|
|
"std_time_ms": 243.53272527540335,
|
|
"throughput": 0.8638775423481264
|
|
},
|
|
{
|
|
"efficiency_percent": null,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 20,
|
|
"max_time_ms": 16.490006,
|
|
"mean_time_ms": 8.214337000000002,
|
|
"metadata": {
|
|
"matrix_size": "128",
|
|
"tflops": "0.001"
|
|
},
|
|
"min_time_ms": 3.316313,
|
|
"name": "gemm_128x128",
|
|
"operation": "gemm",
|
|
"std_time_ms": 4.271369656748477,
|
|
"throughput": 0.0005106077337708447
|
|
},
|
|
{
|
|
"efficiency_percent": null,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 20,
|
|
"max_time_ms": 175.19369,
|
|
"mean_time_ms": 85.41927405,
|
|
"metadata": {
|
|
"matrix_size": "256",
|
|
"tflops": "0.000"
|
|
},
|
|
"min_time_ms": 37.718396,
|
|
"name": "gemm_256x256",
|
|
"operation": "gemm",
|
|
"std_time_ms": 38.2258611390462,
|
|
"throughput": 0.00039282038360989797
|
|
},
|
|
{
|
|
"efficiency_percent": null,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 20,
|
|
"max_time_ms": 1099.584508,
|
|
"mean_time_ms": 720.2384636500001,
|
|
"metadata": {
|
|
"matrix_size": "512",
|
|
"tflops": "0.000"
|
|
},
|
|
"min_time_ms": 416.415041,
|
|
"name": "gemm_512x512",
|
|
"operation": "gemm",
|
|
"std_time_ms": 183.51006806750456,
|
|
"throughput": 0.0003727035829767156
|
|
},
|
|
{
|
|
"efficiency_percent": 0.0,
|
|
"gpu_info": {
|
|
"available": false,
|
|
"compute_capability": "N/A",
|
|
"cuda_version": "N/A",
|
|
"driver_version": "N/A",
|
|
"max_threads_per_block": 0,
|
|
"memory_gb": 0.0,
|
|
"name": "N/A",
|
|
"num_sms": 0
|
|
},
|
|
"iterations": 50,
|
|
"max_time_ms": 383.561285,
|
|
"mean_time_ms": 236.66858410000003,
|
|
"metadata": {
|
|
"batch_size": "64",
|
|
"dims": "128",
|
|
"num_vectors": "10000"
|
|
},
|
|
"min_time_ms": 121.239973,
|
|
"name": "l2_distance_128d_10000v",
|
|
"operation": "l2_distance",
|
|
"std_time_ms": 62.27295731680189,
|
|
"throughput": 2704203.443113428
|
|
}
|
|
],
|
|
"timestamp": "2025-12-02T00:16:10.163679757+00:00"
|
|
} |