{
  "current_gpu_type": "Tesla T4",
  "current_gpu_total_memory": 15095.0625,
  "perplexity": 30815030.0,
  "memory_inference_first": 1142.0,
  "memory_inference": 1142.0,
  "token_generation_latency_sync": 147.6204864501953,
  "token_generation_latency_async": 147.56362289190292,
  "token_generation_throughput_sync": 0.006774127521503482,
  "token_generation_throughput_async": 0.006776737927697435,
  "token_generation_CO2_emissions": 0.00020048614177282614,
  "token_generation_energy_consumption": 0.008781923951582248,
  "inference_latency_sync": 1151.6722137451172,
  "inference_latency_async": 424.6630907058716,
  "inference_throughput_sync": 0.0008683026194997837,
  "inference_throughput_async": 0.00235480789803938,
  "inference_CO2_emissions": 0.0002004475962713345,
  "inference_energy_consumption": 0.0006890801651842688
}