Julien Simon committed on
Commit
ea42ef4
1 Parent(s): 8383fbb

Add SuperNova on trn1

Browse files
Files changed (2) hide show
  1. results.py +7 -0
  2. results_arcee_supernova.py +19 -0
results.py CHANGED
@@ -157,6 +157,13 @@ instance_type_mappings = {
157
  "url": "https://instances.vantage.sh/aws/ec2/inf2.48xlarge",
158
  "price": 12.981,
159
  },
 
 
 
 
 
 
 
160
  }
161
 
162
  results = {
 
157
  "url": "https://instances.vantage.sh/aws/ec2/inf2.48xlarge",
158
  "price": 12.981,
159
  },
160
+ "trn1.32xlarge": {
161
+ "cloud": "AWS",
162
+ "gpu": "32xNeuronCore v2",
163
+ "gpuRAM": "512 GB",
164
+ "url": "https://instances.vantage.sh/aws/ec2/trn1.32xlarge",
165
+ "price": 21.50,
166
+ },
167
  }
168
 
169
  results = {
results_arcee_supernova.py CHANGED
@@ -45,6 +45,13 @@ results_arcee_supernova = {
45
  "tokensPerSecond": "-",
46
  "notes": "OOM bs=2,seqlen=2048 - SDK 2.19.1",
47
  },
 
 
 
 
 
 
 
48
  ],
49
  },
50
  {
@@ -73,6 +80,18 @@ results_arcee_supernova = {
73
  },
74
  ],
75
  },
 
 
 
 
 
 
 
 
 
 
 
 
76
  {
77
  "instanceType": "p4d.24xlarge",
78
  "quantization": "none",
 
45
  "tokensPerSecond": "-",
46
  "notes": "OOM bs=2,seqlen=2048 - SDK 2.19.1",
47
  },
48
+ {
49
+ "quantization": "8-bit",
50
+ "container": "LMI 0.29+transformers-neuronx 0.11.351",
51
+ "status": "???",
52
+ "tokensPerSecond": "???",
53
+ "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
54
+ },
55
  ],
56
  },
57
  {
 
80
  },
81
  ],
82
  },
83
+ {
84
+ "instanceType": "trn1.32xlarge",
85
+ "configurations": [
86
+ {
87
+ "quantization": "none",
88
+ "container": "LMI 0.29+transformers-neuronx 0.11.351",
89
+ "status": "OK",
90
+ "tokensPerSecond": "32",
91
+ "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
92
+ },
93
+ ],
94
+ },
95
  {
96
  "instanceType": "p4d.24xlarge",
97
  "quantization": "none",