|
{ |
|
"base_current_gpu_type": "NVIDIA A100-PCIE-40GB", |
|
"base_current_gpu_total_memory": 40339.3125, |
|
"base_perplexity": 82.86221313476562, |
|
"base_token_generation_latency_sync": 20.888434410095215, |
|
"base_token_generation_latency_async": 20.86069267243147, |
|
"base_token_generation_throughput_sync": 0.04787338200495811, |
|
"base_token_generation_throughput_async": 0.04793704675595715, |
|
"base_token_generation_CO2_emissions": null, |
|
"base_token_generation_energy_consumption": null, |
|
"base_inference_latency_sync": 40.887705612182614, |
|
"base_inference_latency_async": 17.732644081115723, |
|
"base_inference_throughput_sync": 0.024457229502798192, |
|
"base_inference_throughput_async": 0.05639316931110935, |
|
"base_inference_CO2_emissions": null, |
|
"base_inference_energy_consumption": null, |
|
"smashed_current_gpu_type": "NVIDIA A100-PCIE-40GB", |
|
"smashed_current_gpu_total_memory": 40339.3125, |
|
"smashed_perplexity": 92.91635131835938, |
|
"smashed_token_generation_latency_sync": 24.19665660858154, |
|
"smashed_token_generation_latency_async": 24.469297379255295, |
|
"smashed_token_generation_throughput_sync": 0.04132802379173914, |
|
"smashed_token_generation_throughput_async": 0.040867540432435345, |
|
"smashed_token_generation_CO2_emissions": null, |
|
"smashed_token_generation_energy_consumption": null, |
|
"smashed_inference_latency_sync": 52.49914817810058, |
|
"smashed_inference_latency_async": 26.189470291137695, |
|
"smashed_inference_throughput_sync": 0.019047928103662803, |
|
"smashed_inference_throughput_async": 0.038183284689740055, |
|
"smashed_inference_CO2_emissions": null, |
|
"smashed_inference_energy_consumption": null |
|
} |