|
{ |
|
"base_current_gpu_type": "NVIDIA A100-PCIE-40GB", |
|
"base_current_gpu_total_memory": 40339.3125, |
|
"base_perplexity": 8.891793251037598, |
|
"base_token_generation_latency_sync": 36.54602737426758, |
|
"base_token_generation_latency_async": 36.249685660004616, |
|
"base_token_generation_throughput_sync": 0.02736275518427784, |
|
"base_token_generation_throughput_async": 0.027586446110988778, |
|
"base_token_generation_CO2_emissions": null, |
|
"base_token_generation_energy_consumption": null, |
|
"base_inference_latency_sync": 119.13349075317383, |
|
"base_inference_latency_async": 39.10982608795166, |
|
"base_inference_throughput_sync": 0.00839394525987529, |
|
"base_inference_throughput_async": 0.025569021906442696, |
|
"base_inference_CO2_emissions": null, |
|
"base_inference_energy_consumption": null, |
|
"smashed_current_gpu_type": "NVIDIA A100-PCIE-40GB", |
|
"smashed_current_gpu_total_memory": 40339.3125, |
|
"smashed_perplexity": 9.47966194152832, |
|
"smashed_token_generation_latency_sync": 167.53070373535155, |
|
"smashed_token_generation_latency_async": 167.87611786276102, |
|
"smashed_token_generation_throughput_sync": 0.005969055090819061, |
|
"smashed_token_generation_throughput_async": 0.005956773439432889, |
|
"smashed_token_generation_CO2_emissions": null, |
|
"smashed_token_generation_energy_consumption": null, |
|
"smashed_inference_latency_sync": 265.20934295654297, |
|
"smashed_inference_latency_async": 196.3787078857422, |
|
"smashed_inference_throughput_sync": 0.003770606226960335, |
|
"smashed_inference_throughput_async": 0.005092201750211249, |
|
"smashed_inference_CO2_emissions": null, |
|
"smashed_inference_energy_consumption": null |
|
} |