{
  "current_gpu_type": "NVIDIA A10G",
  "current_gpu_total_memory": 22716.5,
  "memory_inference_first": 4286.0,
  "memory_inference": 4208.0,
  "token_generation_latency_sync": 64.72505264282226,
  "token_generation_latency_async": 64.4813310354948,
  "token_generation_throughput_sync": 0.015449968121592494,
  "token_generation_throughput_async": 0.015508364730398223,
  "token_generation_CO2_emissions": 4.161721770576098e-06,
  "token_generation_energy_consumption": 0.0031534097319298876,
  "inference_latency_sync": 47.56480026245117,
  "inference_latency_async": 47.13015556335449,
  "inference_throughput_sync": 0.0210239503683867,
  "inference_throughput_async": 0.02121783787994832,
  "inference_CO2_emissions": 3.2781412719702414e-06,
  "inference_energy_consumption": 1.0538887149448775e-05
}