{ "current_gpu_type": "NVIDIA A10G", "current_gpu_total_memory": 22716.5, "memory_inference_first": 4286.0, "memory_inference": 4208.0, "token_generation_latency_sync": 64.72505264282226, "token_generation_latency_async": 64.4813310354948, "token_generation_throughput_sync": 0.015449968121592494, "token_generation_throughput_async": 0.015508364730398223, "token_generation_CO2_emissions": 4.161721770576098e-06, "token_generation_energy_consumption": 0.0031534097319298876, "inference_latency_sync": 47.56480026245117, "inference_latency_async": 47.13015556335449, "inference_throughput_sync": 0.0210239503683867, "inference_throughput_async": 0.02121783787994832, "inference_CO2_emissions": 3.2781412719702414e-06, "inference_energy_consumption": 1.0538887149448775e-05 }