{ "Model": "microsoft/Phi-3-small-8k-instruct", "GPU": "NVIDIA A100-SXM4-40GB", "TP": 1, "PP": 1, "Energy/req (J)": 45.645894049912414, "Avg TPOT (s)": 0.14053497655998956, "Token tput (tok/s)": 1547.4100016905459, "Avg Output Tokens": 404.468, "Avg BS (reqs)": 255.41870401139332, "Max BS (reqs)": 256 }