Spaces:
Running
Running
Julien Simon
committed on
Commit
•
ea42ef4
1
Parent(s):
8383fbb
Add SuperNova on trn1
Browse files
- results.py +7 -0
- results_arcee_supernova.py +19 -0
results.py
CHANGED
@@ -157,6 +157,13 @@ instance_type_mappings = {
|
|
157 |
"url": "https://instances.vantage.sh/aws/ec2/inf2.48xlarge",
|
158 |
"price": 12.981,
|
159 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
160 |
}
|
161 |
|
162 |
results = {
|
|
|
157 |
"url": "https://instances.vantage.sh/aws/ec2/inf2.48xlarge",
|
158 |
"price": 12.981,
|
159 |
},
|
160 |
+
"trn1.32xlarge": {
|
161 |
+
"cloud": "AWS",
|
162 |
+
"gpu": "32xNeuronCore v2",
|
163 |
+
"gpuRAM": "512 GB",
|
164 |
+
"url": "https://instances.vantage.sh/aws/ec2/trn1.32xlarge",
|
165 |
+
"price": 21.50,
|
166 |
+
},
|
167 |
}
|
168 |
|
169 |
results = {
|
results_arcee_supernova.py
CHANGED
@@ -45,6 +45,13 @@ results_arcee_supernova = {
|
|
45 |
"tokensPerSecond": "-",
|
46 |
"notes": "OOM bs=2,seqlen=2048 - SDK 2.19.1",
|
47 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
],
|
49 |
},
|
50 |
{
|
@@ -73,6 +80,18 @@ results_arcee_supernova = {
|
|
73 |
},
|
74 |
],
|
75 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
76 |
{
|
77 |
"instanceType": "p4d.24xlarge",
|
78 |
"quantization": "none",
|
|
|
45 |
"tokensPerSecond": "-",
|
46 |
"notes": "OOM bs=2,seqlen=2048 - SDK 2.19.1",
|
47 |
},
|
48 |
+
{
|
49 |
+
"quantization": "8-bit",
|
50 |
+
"container": "LMI 0.29+transformers-neuronx 0.11.351",
|
51 |
+
"status": "???",
|
52 |
+
"tokensPerSecond": "???",
|
53 |
+
"notes": "bs=2,seqlen=8192 - SDK 2.19.1",
|
54 |
+
},
|
55 |
],
|
56 |
},
|
57 |
{
|
|
|
80 |
},
|
81 |
],
|
82 |
},
|
83 |
+
{
|
84 |
+
"instanceType": "trn1.32xlarge",
|
85 |
+
"configurations": [
|
86 |
+
{
|
87 |
+
"quantization": "none",
|
88 |
+
"container": "LMI 0.29+transformers-neuronx 0.11.351",
|
89 |
+
"status": "OK",
|
90 |
+
"tokensPerSecond": "32",
|
91 |
+
"notes": "bs=2,seqlen=8192 - SDK 2.19.1",
|
92 |
+
},
|
93 |
+
],
|
94 |
+
},
|
95 |
{
|
96 |
"instanceType": "p4d.24xlarge",
|
97 |
"quantization": "none",
|