|
{ |
|
"current_gpu_type": "NVIDIA A10G", |
|
"current_gpu_total_memory": 22716.5, |
|
"memory_inference_first": 4286.0, |
|
"memory_inference": 4208.0, |
|
"token_generation_latency_sync": 64.72505264282226, |
|
"token_generation_latency_async": 64.4813310354948, |
|
"token_generation_throughput_sync": 0.015449968121592494, |
|
"token_generation_throughput_async": 0.015508364730398223, |
|
"token_generation_CO2_emissions": 4.161721770576098e-06, |
|
"token_generation_energy_consumption": 0.0031534097319298876, |
|
"inference_latency_sync": 47.56480026245117, |
|
"inference_latency_async": 47.13015556335449, |
|
"inference_throughput_sync": 0.0210239503683867, |
|
"inference_throughput_async": 0.02121783787994832, |
|
"inference_CO2_emissions": 3.2781412719702414e-06, |
|
"inference_energy_consumption": 1.0538887149448775e-05 |
|
} |