|
{ |
|
"current_gpu_type": "Tesla T4", |
|
"current_gpu_total_memory": 15095.0625, |
|
"perplexity": 2.7251362800598145, |
|
"memory_inference_first": 1690.0, |
|
"memory_inference": 1690.0, |
|
"token_generation_latency_sync": 155.3000717163086, |
|
"token_generation_latency_async": 155.34533187747002, |
|
"token_generation_throughput_sync": 0.006439147058648696, |
|
"token_generation_throughput_async": 0.0064372710007711, |
|
"token_generation_CO2_emissions": 0.00020285744923935242, |
|
"token_generation_energy_consumption": 0.009233308010788546, |
|
"inference_latency_sync": 1166.3823852539062, |
|
"inference_latency_async": 429.13405895233154, |
|
"inference_throughput_sync": 0.0008573517678615431, |
|
"inference_throughput_async": 0.0023302741396041943, |
|
"inference_CO2_emissions": 0.000202412501568058, |
|
"inference_energy_consumption": 0.0006962767357209158 |
|
} |