{ "current_gpu_type": "NVIDIA A100-PCIE-40GB", "current_gpu_total_memory": 40339.3125, "perplexity": 7.971606254577637, "token_generation_latency_sync": 51.49340744018555, "token_generation_latency_async": 51.413884572684765, "token_generation_throughput_sync": 0.019419961694350764, "token_generation_throughput_async": 0.019449998931441982, "token_generation_CO2_emissions": null, "token_generation_energy_consumption": null, "inference_latency_sync": 183.4039321899414, "inference_latency_async": 104.15270328521729, "inference_throughput_sync": 0.005452445801240264, "inference_throughput_async": 0.009601287037759807, "inference_CO2_emissions": null, "inference_energy_consumption": null }