|
{ |
|
"base_current_gpu_type": "NVIDIA A100-PCIE-40GB", |
|
"base_current_gpu_total_memory": 40339.3125, |
|
"base_perplexity": 8.405904769897461, |
|
"base_token_generation_latency_sync": 38.60344696044922, |
|
"base_token_generation_latency_async": 38.134160824120045, |
|
"base_token_generation_throughput_sync": 0.025904422499486643, |
|
"base_token_generation_throughput_async": 0.026223207181931614, |
|
"base_token_generation_CO2_emissions": null, |
|
"base_token_generation_energy_consumption": null, |
|
"base_inference_latency_sync": 120.48721923828126, |
|
"base_inference_latency_async": 39.444828033447266, |
|
"base_inference_throughput_sync": 0.008299635482684288, |
|
"base_inference_throughput_async": 0.025351866134440983, |
|
"base_inference_CO2_emissions": null, |
|
"base_inference_energy_consumption": null, |
|
"smashed_current_gpu_type": "NVIDIA A100-PCIE-40GB", |
|
"smashed_current_gpu_total_memory": 40339.3125, |
|
"smashed_perplexity": 9.43250846862793, |
|
"smashed_token_generation_latency_sync": 62.9321174621582, |
|
"smashed_token_generation_latency_async": 62.363552674651146, |
|
"smashed_token_generation_throughput_sync": 0.015890137505722914, |
|
"smashed_token_generation_throughput_async": 0.016035006940944674, |
|
"smashed_token_generation_CO2_emissions": null, |
|
"smashed_token_generation_energy_consumption": null, |
|
"smashed_inference_latency_sync": 198.10078887939454, |
|
"smashed_inference_latency_async": 111.86470985412598, |
|
"smashed_inference_throughput_sync": 0.005047935475960212, |
|
"smashed_inference_throughput_async": 0.008939369719941363, |
|
"smashed_inference_CO2_emissions": null, |
|
"smashed_inference_energy_consumption": null |
|
} |