{ "base_current_gpu_type": "NVIDIA A100-PCIE-40GB", "base_current_gpu_total_memory": 40339.3125, "base_perplexity": 6.637787342071533, "base_token_generation_latency_sync": 37.664760208129884, "base_token_generation_latency_async": 37.534007616341114, "base_token_generation_throughput_sync": 0.026550016367398815, "base_token_generation_throughput_async": 0.026642505383960964, "base_token_generation_CO2_emissions": null, "base_token_generation_energy_consumption": null, "base_inference_latency_sync": 118.52748794555664, "base_inference_latency_async": 38.34338188171387, "base_inference_throughput_sync": 0.00843686150219712, "base_inference_throughput_async": 0.026080119982241433, "base_inference_CO2_emissions": null, "base_inference_energy_consumption": null, "smashed_current_gpu_type": "NVIDIA A100-PCIE-40GB", "smashed_current_gpu_total_memory": 40339.3125, "smashed_perplexity": 7.146455764770508, "smashed_token_generation_latency_sync": 44.163258743286136, "smashed_token_generation_latency_async": 44.04097441583872, "smashed_token_generation_throughput_sync": 0.022643256599628164, "smashed_token_generation_throughput_async": 0.022706127947077485, "smashed_token_generation_CO2_emissions": null, "smashed_token_generation_energy_consumption": null, "smashed_inference_latency_sync": 161.99608306884767, "smashed_inference_latency_async": 69.91302967071533, "smashed_inference_throughput_sync": 0.006172988760320854, "smashed_inference_throughput_async": 0.014303485411945647, "smashed_inference_CO2_emissions": null, "smashed_inference_energy_consumption": null }