"""Module containing performance results for the Arcee-SuperNova model.""" results_arcee_supernova = { "name": "Arcee-SuperNova", "modelType": "Llama 3.1 70B", "configurations": [ { "instanceType": "g5.12xlarge", "quantization": "awq", "container": "TGI 2.2.0", "status": "OK", "tokensPerSecond": "33", "notes": "", }, { "instanceType": "inf2.24xlarge", "configurations": [ { "quantization": "none", "container": "transformers-neuronx", "status": "KO", "tokensPerSecond": "-", "notes": "OOM bs=2,seqlen=4096", }, { "quantization": "none", "container": "transformers-neuronx", "status": "KO", "tokensPerSecond": "-", "notes": "OOM bs=2,seqlen=2048", }, ], }, { "instanceType": "inf2.48xlarge", "quantization": "none", "container": "transformers-neuronx", "status": "OK", "tokensPerSecond": "28.4", "notes": "bs=4,seqlen=4096", }, { "instanceType": "p4d.24xlarge", "quantization": "none", "container": "TGI 2.2.0", "status": "OK", "tokensPerSecond": "38", "notes": "", }, ], }