{
"current_gpu_type": "NVIDIA A10G",
"current_gpu_total_memory": 22716.5,
"memory_inference_first": 9396.0,
"memory_inference": 9396.0,
"token_generation_latency_sync": 41.4751594543457,
"token_generation_latency_async": 41.440220922231674,
"token_generation_throughput_sync": 0.024110817490666007,
"token_generation_throughput_async": 0.024131145484881433,
"token_generation_CO2_emissions": 2.7722372785106468e-06,
"token_generation_energy_consumption": 0.0013460853224844924,
"inference_latency_sync": 34.25094375610352,
"inference_latency_async": 27.751636505126953,
"inference_throughput_sync": 0.02919627579084737,
"inference_throughput_async": 0.036033911002518924,
"inference_CO2_emissions": 1.7203736862892723e-06,
"inference_energy_consumption": 9.17469136023194e-06
}