File size: 1,610 Bytes
2918d72 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 |
{
"base_current_gpu_type": "NVIDIA A100-PCIE-40GB",
"base_current_gpu_total_memory": 40339.3125,
"base_token_generation_latency_sync": 58.560171890258786,
"base_token_generation_latency_async": 58.45238883048296,
"base_token_generation_throughput_sync": 0.017076452607994227,
"base_token_generation_throughput_async": 0.017107940667747342,
"base_token_generation_CO2_emissions": null,
"base_token_generation_energy_consumption": null,
"base_inference_latency_sync": 55.90609893798828,
"base_inference_latency_async": 55.28888702392578,
"base_inference_throughput_sync": 0.017887136090629613,
"base_inference_throughput_async": 0.01808681733034812,
"base_inference_CO2_emissions": null,
"base_inference_energy_consumption": null,
"smashed_current_gpu_type": "NVIDIA A100-PCIE-40GB",
"smashed_current_gpu_total_memory": 40339.3125,
"smashed_token_generation_latency_sync": 175.9563995361328,
"smashed_token_generation_latency_async": 174.2004169151187,
"smashed_token_generation_throughput_sync": 0.005683226086895743,
"smashed_token_generation_throughput_async": 0.005740514389740309,
"smashed_token_generation_CO2_emissions": null,
"smashed_token_generation_energy_consumption": null,
"smashed_inference_latency_sync": 178.78282165527344,
"smashed_inference_latency_async": 156.2723159790039,
"smashed_inference_throughput_sync": 0.00559337855136992,
"smashed_inference_throughput_async": 0.006399086068029834,
"smashed_inference_CO2_emissions": null,
"smashed_inference_energy_consumption": null
} |