kreas commited on
Commit
d6d242e
1 Parent(s): 9eaec6b

Upload /Llama-2-13b-hf/fp4_batch_size_1_sq_len_256_new_tokens_256/benchmark_report.json with huggingface_hub

Browse files
Llama-2-13b-hf/fp4_batch_size_1_sq_len_256_new_tokens_256/benchmark_report.json CHANGED
@@ -2,141 +2,140 @@
2
  "prefill": {
3
  "memory": {
4
  "unit": "MB",
5
- "max_ram": 1019.363328,
6
  "max_vram": 8359.247872,
7
  "max_reserved": 7874.80576,
8
  "max_allocated": 7776.413184
9
  },
10
  "latency": {
11
  "unit": "s",
12
- "mean": 0.0836540125528971,
13
- "stdev": 0.0004950226120967272,
14
  "values": [
15
- 0.08893036651611329,
16
- 0.08383487701416016,
17
- 0.08396697235107421,
18
- 0.08398339080810546,
19
- 0.08404889678955078,
20
- 0.08359935760498047,
21
- 0.08343449401855468,
22
- 0.08351436614990235,
23
- 0.08349900817871093,
24
- 0.08351744079589844,
25
- 0.08353997039794922,
26
- 0.08338739013671875,
27
- 0.08361779022216796,
28
- 0.08342221069335938,
29
- 0.08357478332519531,
30
- 0.08358911895751953,
31
- 0.08355020904541016,
32
- 0.08342745971679688,
33
- 0.08355532836914062,
34
- 0.08364543914794922,
35
- 0.08358809661865234,
36
- 0.08351026916503906,
37
- 0.08358399963378907,
38
- 0.08349388885498046,
39
- 0.08360038757324219,
40
- 0.08353596496582032,
41
- 0.0835962905883789,
42
- 0.08343961334228515,
43
- 0.08357695770263672,
44
- 0.08344064331054687,
45
- 0.08356352233886719,
46
- 0.08356668853759766,
47
- 0.08362290954589843,
48
- 0.08362496185302734,
49
- 0.08355532836914062,
50
- 0.08358502197265626,
51
- 0.08353587341308594,
52
- 0.08366284942626953,
53
- 0.08354918670654297,
54
- 0.08366284942626953,
55
- 0.08356658935546875,
56
- 0.08366182708740234,
57
- 0.08340377807617187,
58
- 0.08363724517822266,
59
- 0.08350003051757812,
60
- 0.08364031982421875,
61
- 0.08361676788330077,
62
- 0.08365055847167968,
63
- 0.08357785797119141,
64
- 0.08353401947021484,
65
- 0.08356364440917968,
66
- 0.08372940826416016,
67
- 0.08352460479736327,
68
- 0.08373350524902344,
69
- 0.08351846313476563,
70
- 0.08370893096923829,
71
- 0.08348467254638672,
72
- 0.08371302032470704,
73
- 0.0835563507080078,
74
- 0.0836648941040039,
75
- 0.08359321594238281,
76
- 0.0836648941040039,
77
- 0.08353485107421875,
78
- 0.0836157455444336,
79
- 0.08360550689697266,
80
- 0.0836659164428711,
81
- 0.08361164855957032,
82
- 0.0836495361328125,
83
- 0.083557373046875,
84
- 0.08371916961669922,
85
- 0.08353791809082031,
86
- 0.08374374389648437,
87
- 0.08362393951416015,
88
- 0.08375296020507812,
89
- 0.08338739013671875,
90
- 0.08369459533691406,
91
- 0.08367308807373047,
92
- 0.08367001342773438,
93
- 0.08354303741455078,
94
- 0.08365475463867188,
95
- 0.08365567779541015,
96
- 0.0836157455444336,
97
- 0.08364351654052735,
98
- 0.08361488342285156,
99
- 0.08365158081054687,
100
- 0.08356470489501953,
101
- 0.08364543914794922,
102
- 0.08368128204345703,
103
- 0.08365773010253906,
104
- 0.08355430603027343,
105
- 0.08367922973632813,
106
- 0.08345906829833985,
107
- 0.08357785797119141,
108
- 0.08364441680908204,
109
- 0.08360467529296875,
110
- 0.08360140991210938,
111
- 0.08359117126464843,
112
- 0.08353177642822265,
113
- 0.0836659164428711,
114
- 0.08361164855957032,
115
- 0.08363212585449219,
116
- 0.0835962905883789,
117
- 0.08364031982421875,
118
- 0.08354611206054688,
119
- 0.08392092895507812,
120
- 0.08359833526611328,
121
- 0.08363827514648438,
122
- 0.08354508972167969,
123
- 0.08355020904541016,
124
- 0.08361881256103515,
125
- 0.0835788803100586,
126
- 0.08365670776367187,
127
- 0.08373043060302734,
128
- 0.08362188720703125,
129
- 0.08371302032470704,
130
- 0.08370381164550782,
131
- 0.08365875244140625,
132
- 0.08364134216308594,
133
- 0.08365773010253906,
134
- 0.08356044769287109
135
  ]
136
  },
137
  "throughput": {
138
  "unit": "tokens/s",
139
- "value": 3060.2237978497806
140
  },
141
  "energy": null,
142
  "efficiency": null
@@ -144,22 +143,22 @@
144
  "decode": {
145
  "memory": {
146
  "unit": "MB",
147
- "max_ram": 1019.363328,
148
  "max_vram": 9105.833984,
149
  "max_reserved": 8621.391872,
150
  "max_allocated": 8484.938752
151
  },
152
  "latency": {
153
  "unit": "s",
154
- "mean": 10.723862522125254,
155
  "stdev": 0,
156
  "values": [
157
- 10.723862522125254
158
  ]
159
  },
160
  "throughput": {
161
  "unit": "tokens/s",
162
- "value": 23.77874571535109
163
  },
164
  "energy": null,
165
  "efficiency": null
@@ -168,269 +167,269 @@
168
  "memory": null,
169
  "latency": {
170
  "unit": "s",
171
- "mean": 0.04205436283186374,
172
- "stdev": 0.00016867759279344603,
173
  "values": [
174
- 0.04243769454956055,
175
- 0.04276249694824219,
176
- 0.041958080291748044,
177
- 0.04204054260253906,
178
- 0.041990238189697264,
179
- 0.042020542144775394,
180
- 0.04208639907836914,
181
- 0.0421163215637207,
182
- 0.04202883148193359,
183
- 0.04214281463623047,
184
- 0.04195625686645508,
185
- 0.042035263061523435,
186
- 0.042060928344726564,
187
- 0.04195644760131836,
188
- 0.04194915390014648,
189
- 0.04201446533203125,
190
- 0.041931007385253904,
191
- 0.04209231948852539,
192
- 0.041755870819091795,
193
- 0.04209126281738281,
194
- 0.041973758697509765,
195
- 0.04218572616577149,
196
- 0.04186636734008789,
197
- 0.04215411376953125,
198
- 0.04221721649169922,
199
- 0.04212940979003906,
200
- 0.04205267333984375,
201
- 0.042124225616455076,
202
- 0.04215193557739258,
203
- 0.04208947372436524,
204
- 0.04196044921875,
205
- 0.04206611251831055,
206
- 0.04249375915527344,
207
- 0.04209971237182617,
208
- 0.04207430267333984,
209
- 0.041922367095947266,
210
- 0.04214886474609375,
211
- 0.042041534423828124,
212
- 0.04205065536499023,
213
- 0.04199497604370117,
214
- 0.04206003189086914,
215
- 0.0419480972290039,
216
- 0.04211692810058594,
217
- 0.04226764678955078,
218
- 0.04206796646118164,
219
- 0.042092544555664066,
220
- 0.042011646270751955,
221
- 0.04193075180053711,
222
- 0.04185190582275391,
223
- 0.04216947174072266,
224
- 0.0418917121887207,
225
- 0.04214681625366211,
226
- 0.04191971206665039,
227
- 0.04193974304199219,
228
- 0.04192051315307617,
229
- 0.04207820892333984,
230
- 0.04203747177124023,
231
- 0.04211606216430664,
232
- 0.04280710220336914,
233
- 0.04209868621826172,
234
- 0.04174540710449219,
235
- 0.041919486999511715,
236
- 0.04193484878540039,
237
- 0.0419317741394043,
238
- 0.04189184188842773,
239
- 0.04213862228393555,
240
- 0.04188678359985352,
241
- 0.041958335876464845,
242
- 0.042090496063232424,
243
- 0.042049537658691405,
244
- 0.042033153533935545,
245
- 0.04197273635864258,
246
- 0.04207206344604492,
247
- 0.04225024032592774,
248
- 0.04209664154052734,
249
- 0.04206003189086914,
250
- 0.04214246368408203,
251
- 0.042234878540039066,
252
- 0.04206700897216797,
253
- 0.04203411102294922,
254
- 0.04239974212646484,
255
- 0.04236288070678711,
256
- 0.042031105041503904,
257
- 0.04196147155761719,
258
- 0.04199321746826172,
259
- 0.04216012954711914,
260
- 0.042221569061279295,
261
- 0.04207132720947265,
262
- 0.04227350234985352,
263
- 0.04233830261230469,
264
- 0.04214374542236328,
265
- 0.04254719924926758,
266
- 0.041981952667236325,
267
- 0.04189081573486328,
268
- 0.041973758697509765,
269
- 0.04208537673950195,
270
- 0.04187443161010742,
271
- 0.04192972946166992,
272
- 0.04190617752075195,
273
- 0.04196249771118164,
274
- 0.04190003204345703,
275
- 0.04210905456542969,
276
- 0.04186304092407227,
277
- 0.04199423980712891,
278
- 0.04184371185302734,
279
- 0.04199731063842774,
280
- 0.04178841781616211,
281
- 0.04206489562988281,
282
- 0.04204339218139649,
283
- 0.042052608489990234,
284
- 0.041801727294921875,
285
- 0.04189798355102539,
286
- 0.041880577087402344,
287
- 0.04199731063842774,
288
- 0.04173030471801758,
289
- 0.041860862731933596,
290
- 0.0419288330078125,
291
- 0.04200128173828125,
292
- 0.041987071990966796,
293
- 0.0420118408203125,
294
- 0.04192748641967774,
295
- 0.04208947372436524,
296
- 0.041902080535888675,
297
- 0.042021888732910156,
298
- 0.042103809356689455,
299
- 0.04203519821166992,
300
- 0.04205567932128906,
301
- 0.04191641616821289,
302
- 0.04273664093017578,
303
- 0.042102783203125,
304
- 0.042071041107177735,
305
- 0.04190851211547852,
306
- 0.041956062316894534,
307
- 0.041990142822265625,
308
- 0.04193382263183594,
309
- 0.04182425689697265,
310
- 0.042016769409179686,
311
- 0.042310657501220705,
312
- 0.04207308959960938,
313
- 0.04248166275024414,
314
- 0.04210483169555664,
315
- 0.042229793548583985,
316
- 0.04196063995361328,
317
- 0.04214163208007812,
318
- 0.04209648132324219,
319
- 0.042145790100097655,
320
- 0.04211199951171875,
321
- 0.04187977600097656,
322
- 0.042318782806396484,
323
- 0.0418240966796875,
324
- 0.04203519821166992,
325
- 0.042076160430908206,
326
- 0.042164222717285156,
327
- 0.042310657501220705,
328
- 0.04257382583618164,
329
- 0.04201372909545899,
330
- 0.04203414535522461,
331
- 0.04188159942626953,
332
- 0.04205363082885742,
333
- 0.04189811325073242,
334
- 0.041983871459960936,
335
- 0.04196249771118164,
336
- 0.04201267242431641,
337
- 0.041931041717529295,
338
- 0.04218751907348633,
339
- 0.04189081573486328,
340
- 0.04189487838745117,
341
- 0.041973758697509765,
342
- 0.04204646301269531,
343
- 0.04222777557373047,
344
- 0.04200646209716797,
345
- 0.04234550476074219,
346
- 0.042064865112304686,
347
- 0.04199423980712891,
348
- 0.041970687866210936,
349
- 0.04220415878295898,
350
- 0.042650688171386716,
351
- 0.04211523056030273,
352
- 0.042135326385498044,
353
- 0.042028030395507815,
354
- 0.04226559829711914,
355
- 0.04201881790161133,
356
- 0.042008575439453126,
357
- 0.042028030395507815,
358
- 0.04200681686401367,
359
- 0.041908958435058596,
360
- 0.04208230209350586,
361
- 0.04252979278564453,
362
- 0.04196556854248047,
363
- 0.04192998504638672,
364
- 0.042114814758300784,
365
- 0.042188800811767575,
366
- 0.042016769409179686,
367
- 0.042434558868408204,
368
- 0.04198092651367188,
369
- 0.041879745483398435,
370
- 0.04222137451171875,
371
- 0.04189491271972656,
372
- 0.04216960144042969,
373
- 0.04200115203857422,
374
- 0.04220134353637695,
375
- 0.04171772766113281,
376
- 0.04197891235351563,
377
- 0.04201548767089844,
378
- 0.042052608489990234,
379
- 0.04190617752075195,
380
- 0.04195532989501953,
381
- 0.04198092651367188,
382
- 0.04211711883544922,
383
- 0.041826305389404295,
384
- 0.04204339218139649,
385
- 0.041989345550537106,
386
- 0.04184963226318359,
387
- 0.04198092651367188,
388
- 0.04197273635864258,
389
- 0.041902080535888675,
390
- 0.04210300827026367,
391
- 0.04187625503540039,
392
- 0.041801727294921875,
393
- 0.04195942306518555,
394
- 0.04183369445800781,
395
- 0.041998336791992184,
396
- 0.04205033493041992,
397
- 0.04211609649658203,
398
- 0.04238438415527344,
399
- 0.042060001373291016,
400
- 0.04198070526123047,
401
- 0.042102783203125,
402
- 0.042092544555664066,
403
- 0.042151966094970704,
404
- 0.04178531265258789,
405
- 0.04196147155761719,
406
- 0.04178025436401367,
407
- 0.04200649642944336,
408
- 0.04227276611328125,
409
- 0.042343425750732425,
410
- 0.041955486297607425,
411
- 0.0421069450378418,
412
- 0.04194793701171875,
413
- 0.042175487518310545,
414
- 0.041864192962646485,
415
- 0.04201881790161133,
416
- 0.04206716918945313,
417
- 0.04197788619995117,
418
- 0.041975551605224606,
419
- 0.04206911849975586,
420
- 0.04215692901611328,
421
- 0.042033153533935545,
422
- 0.04213043212890625,
423
- 0.042202110290527346,
424
- 0.04206182479858398,
425
- 0.04206502532958984,
426
- 0.04209360122680664,
427
- 0.042119007110595706,
428
- 0.042033153533935545
429
  ]
430
  },
431
  "throughput": {
432
  "unit": "tokens/s",
433
- "value": 23.77874571535109
434
  },
435
  "energy": null,
436
  "efficiency": null
 
2
  "prefill": {
3
  "memory": {
4
  "unit": "MB",
5
+ "max_ram": 996.048896,
6
  "max_vram": 8359.247872,
7
  "max_reserved": 7874.80576,
8
  "max_allocated": 7776.413184
9
  },
10
  "latency": {
11
  "unit": "s",
12
+ "mean": 0.08431502924045597,
13
+ "stdev": 0.00040203161198162625,
14
  "values": [
15
+ 0.08844000244140625,
16
+ 0.08441766357421875,
17
+ 0.0846929931640625,
18
+ 0.08442675018310547,
19
+ 0.08467660522460937,
20
+ 0.08479641723632812,
21
+ 0.0844615707397461,
22
+ 0.08435302734375,
23
+ 0.08427519989013672,
24
+ 0.0841185302734375,
25
+ 0.08421376037597657,
26
+ 0.08410214233398437,
27
+ 0.08433356475830078,
28
+ 0.08408780670166016,
29
+ 0.08421887969970702,
30
+ 0.08420454406738281,
31
+ 0.0842086410522461,
32
+ 0.0839362564086914,
33
+ 0.08416767883300781,
34
+ 0.08417705535888671,
35
+ 0.08422297668457031,
36
+ 0.08422297668457031,
37
+ 0.08423833465576172,
38
+ 0.08427008056640625,
39
+ 0.08439193725585938,
40
+ 0.08415654754638671,
41
+ 0.08424447631835938,
42
+ 0.08415846252441406,
43
+ 0.08426905822753906,
44
+ 0.08415436553955079,
45
+ 0.08425881958007812,
46
+ 0.08411341094970703,
47
+ 0.08425472259521484,
48
+ 0.08420454406738281,
49
+ 0.08422297668457031,
50
+ 0.08424038696289063,
51
+ 0.08416255950927734,
52
+ 0.08432640075683594,
53
+ 0.08425369262695312,
54
+ 0.08429875183105469,
55
+ 0.0842608642578125,
56
+ 0.08443196868896484,
57
+ 0.08400895690917969,
58
+ 0.08427622222900391,
59
+ 0.08412057495117188,
60
+ 0.08431718444824218,
61
+ 0.08428543853759765,
62
+ 0.08428237152099609,
63
+ 0.08414412689208985,
64
+ 0.08424960327148437,
65
+ 0.08420966339111328,
66
+ 0.08448716735839844,
67
+ 0.08413081359863281,
68
+ 0.08428749084472656,
69
+ 0.08420146942138672,
70
+ 0.08425984191894531,
71
+ 0.08418118286132813,
72
+ 0.08424755096435547,
73
+ 0.08416255950927734,
74
+ 0.08432434844970703,
75
+ 0.0841871337890625,
76
+ 0.08450559997558593,
77
+ 0.08425676727294922,
78
+ 0.0842639389038086,
79
+ 0.08424038696289063,
80
+ 0.08428749084472656,
81
+ 0.08428749084472656,
82
+ 0.08481587219238282,
83
+ 0.08422911834716797,
84
+ 0.08442060852050781,
85
+ 0.0841185302734375,
86
+ 0.08432947540283203,
87
+ 0.08421785736083984,
88
+ 0.08435302734375,
89
+ 0.0840970230102539,
90
+ 0.08442265319824219,
91
+ 0.08430796813964844,
92
+ 0.08434893035888671,
93
+ 0.08424140930175782,
94
+ 0.08421785736083984,
95
+ 0.08419942474365234,
96
+ 0.08425676727294922,
97
+ 0.08434073638916016,
98
+ 0.0841871337890625,
99
+ 0.08451289367675781,
100
+ 0.08438784027099609,
101
+ 0.08437452697753907,
102
+ 0.08432537841796875,
103
+ 0.08432640075683594,
104
+ 0.08425692749023438,
105
+ 0.08422297668457031,
106
+ 0.08420368194580079,
107
+ 0.08416665649414062,
108
+ 0.08435404968261719,
109
+ 0.08437657928466796,
110
+ 0.08446669006347657,
111
+ 0.08417382049560547,
112
+ 0.08422911834716797,
113
+ 0.08421580505371094,
114
+ 0.08437760162353515,
115
+ 0.08416767883300781,
116
+ 0.08433663940429688,
117
+ 0.08420352172851563,
118
+ 0.08436531066894531,
119
+ 0.08433062744140625,
120
+ 0.08433267211914063,
121
+ 0.08421376037597657,
122
+ 0.08432537841796875,
123
+ 0.08431820678710937,
124
+ 0.08427827453613282,
125
+ 0.08424960327148437,
126
+ 0.08421683502197265,
127
+ 0.08426290893554687,
128
+ 0.08434175872802735,
129
+ 0.08423423767089844,
130
+ 0.08434381103515624,
131
+ 0.08421376037597657,
132
+ 0.08446771240234376,
133
+ 0.08433766174316407
 
134
  ]
135
  },
136
  "throughput": {
137
  "unit": "tokens/s",
138
+ "value": 3036.232120253672
139
  },
140
  "energy": null,
141
  "efficiency": null
 
143
  "decode": {
144
  "memory": {
145
  "unit": "MB",
146
+ "max_ram": 996.048896,
147
  "max_vram": 9105.833984,
148
  "max_reserved": 8621.391872,
149
  "max_allocated": 8484.938752
150
  },
151
  "latency": {
152
  "unit": "s",
153
+ "mean": 12.58805863571167,
154
  "stdev": 0,
155
  "values": [
156
+ 12.58805863571167
157
  ]
158
  },
159
  "throughput": {
160
  "unit": "tokens/s",
161
+ "value": 20.257293628787064
162
  },
163
  "energy": null,
164
  "efficiency": null
 
167
  "memory": null,
168
  "latency": {
169
  "unit": "s",
170
+ "mean": 0.049364935826320275,
171
+ "stdev": 0.0006250009736365216,
172
  "values": [
173
+ 0.050045951843261716,
174
+ 0.050549758911132815,
175
+ 0.04905881500244141,
176
+ 0.049223678588867184,
177
+ 0.04921241760253906,
178
+ 0.04918476867675781,
179
+ 0.0490618896484375,
180
+ 0.04925235366821289,
181
+ 0.04913356781005859,
182
+ 0.049070079803466796,
183
+ 0.04906415939331055,
184
+ 0.049048351287841796,
185
+ 0.0491069450378418,
186
+ 0.04908031845092774,
187
+ 0.04897177505493164,
188
+ 0.04919500732421875,
189
+ 0.04905984115600586,
190
+ 0.04918067169189453,
191
+ 0.048998401641845706,
192
+ 0.04954838562011719,
193
+ 0.04929014587402344,
194
+ 0.049086463928222655,
195
+ 0.04898918533325195,
196
+ 0.04926464080810547,
197
+ 0.049288192749023435,
198
+ 0.04907929611206055,
199
+ 0.04902604675292969,
200
+ 0.049334270477294925,
201
+ 0.04930047988891602,
202
+ 0.04938240051269531,
203
+ 0.0491952018737793,
204
+ 0.04916307067871094,
205
+ 0.0492410888671875,
206
+ 0.04933017730712891,
207
+ 0.049465343475341796,
208
+ 0.049296382904052735,
209
+ 0.04907724761962891,
210
+ 0.04973567962646484,
211
+ 0.04940288162231445,
212
+ 0.04961280059814453,
213
+ 0.04922265625,
214
+ 0.049223678588867184,
215
+ 0.05130035018920898,
216
+ 0.053032958984375,
217
+ 0.05166080093383789,
218
+ 0.04976435089111328,
219
+ 0.049347583770751956,
220
+ 0.04949913787841797,
221
+ 0.05000089645385742,
222
+ 0.04948889541625977,
223
+ 0.049364192962646485,
224
+ 0.04938524627685547,
225
+ 0.04942540740966797,
226
+ 0.049616897583007816,
227
+ 0.04949401473999023,
228
+ 0.049522689819335934,
229
+ 0.049209342956542966,
230
+ 0.049756160736083986,
231
+ 0.049261566162109374,
232
+ 0.04916121673583984,
233
+ 0.04927897644042969,
234
+ 0.04918067169189453,
235
+ 0.04941721725463867,
236
+ 0.04925747299194336,
237
+ 0.04932812881469727,
238
+ 0.049314815521240236,
239
+ 0.049127422332763675,
240
+ 0.049242111206054685,
241
+ 0.049479679107666014,
242
+ 0.04937932968139649,
243
+ 0.049360897064208986,
244
+ 0.04937830352783203,
245
+ 0.04914483261108398,
246
+ 0.0493834228515625,
247
+ 0.049345535278320314,
248
+ 0.0496732177734375,
249
+ 0.04932198333740234,
250
+ 0.04935168075561523,
251
+ 0.04931891250610351,
252
+ 0.04920012664794922,
253
+ 0.049081344604492184,
254
+ 0.049523998260498046,
255
+ 0.04912815856933594,
256
+ 0.04919807815551758,
257
+ 0.04916633605957031,
258
+ 0.05008895874023438,
259
+ 0.049667072296142575,
260
+ 0.04940595245361328,
261
+ 0.04916326522827148,
262
+ 0.0492308464050293,
263
+ 0.04961075210571289,
264
+ 0.04929228973388672,
265
+ 0.04914790344238281,
266
+ 0.04931382369995117,
267
+ 0.049317855834960934,
268
+ 0.04941209411621094,
269
+ 0.04901068878173828,
270
+ 0.04927283096313476,
271
+ 0.04907212829589844,
272
+ 0.049396736145019535,
273
+ 0.04896768188476563,
274
+ 0.0493199348449707,
275
+ 0.04884889602661133,
276
+ 0.049181697845458984,
277
+ 0.0492042236328125,
278
+ 0.04927385711669922,
279
+ 0.04905574417114258,
280
+ 0.04904243087768555,
281
+ 0.04924620819091797,
282
+ 0.049301502227783206,
283
+ 0.04909568023681641,
284
+ 0.049105918884277344,
285
+ 0.04917964935302734,
286
+ 0.04949401473999023,
287
+ 0.049002494812011715,
288
+ 0.05694668960571289,
289
+ 0.05214617538452149,
290
+ 0.04937318420410156,
291
+ 0.04948070526123047,
292
+ 0.049363967895507815,
293
+ 0.0493383674621582,
294
+ 0.049339393615722656,
295
+ 0.04939468765258789,
296
+ 0.04941619110107422,
297
+ 0.049294334411621094,
298
+ 0.04968447875976562,
299
+ 0.04934348678588867,
300
+ 0.04922777557373047,
301
+ 0.049331199645996096,
302
+ 0.04928102493286133,
303
+ 0.049185791015625,
304
+ 0.04919807815551758,
305
+ 0.04931071853637695,
306
+ 0.049309696197509766,
307
+ 0.04937932968139649,
308
+ 0.04939571380615235,
309
+ 0.04918476867675781,
310
+ 0.04913356781005859,
311
+ 0.049181697845458984,
312
+ 0.04927897644042969,
313
+ 0.04932198333740234,
314
+ 0.049107967376708986,
315
+ 0.04920832061767578,
316
+ 0.049086463928222655,
317
+ 0.04929024124145508,
318
+ 0.04934963226318359,
319
+ 0.049672191619873046,
320
+ 0.049206272125244144,
321
+ 0.04924518585205078,
322
+ 0.04909465789794922,
323
+ 0.04922470474243164,
324
+ 0.04916940689086914,
325
+ 0.04929024124145508,
326
+ 0.049560577392578124,
327
+ 0.05010432052612305,
328
+ 0.04920217514038086,
329
+ 0.04918476867675781,
330
+ 0.049320960998535154,
331
+ 0.049361919403076174,
332
+ 0.04940595245361328,
333
+ 0.04930047988891602,
334
+ 0.049617919921875,
335
+ 0.04935168075561523,
336
+ 0.04929228973388672,
337
+ 0.04930252838134765,
338
+ 0.049288192749023435,
339
+ 0.049468414306640625,
340
+ 0.04925030517578125,
341
+ 0.04933222579956055,
342
+ 0.04927385711669922,
343
+ 0.049375232696533204,
344
+ 0.04945407867431641,
345
+ 0.049309696197509766,
346
+ 0.0492308464050293,
347
+ 0.04942950439453125,
348
+ 0.04943360137939453,
349
+ 0.049334270477294925,
350
+ 0.04921548843383789,
351
+ 0.049484798431396484,
352
+ 0.049361919403076174,
353
+ 0.04925235366821289,
354
+ 0.04940390396118164,
355
+ 0.0493834228515625,
356
+ 0.04935168075561523,
357
+ 0.04922880172729492,
358
+ 0.049306625366210936,
359
+ 0.04932812881469727,
360
+ 0.049432575225830076,
361
+ 0.0493834228515625,
362
+ 0.04927385711669922,
363
+ 0.04948070526123047,
364
+ 0.04924620819091797,
365
+ 0.04941619110107422,
366
+ 0.04921139144897461,
367
+ 0.049492992401123044,
368
+ 0.049181697845458984,
369
+ 0.04935065460205078,
370
+ 0.049476608276367184,
371
+ 0.04942131042480469,
372
+ 0.049329151153564454,
373
+ 0.049225727081298826,
374
+ 0.04904959869384766,
375
+ 0.049552383422851565,
376
+ 0.049159168243408206,
377
+ 0.04922060775756836,
378
+ 0.049342464447021485,
379
+ 0.04935168075561523,
380
+ 0.04923699188232422,
381
+ 0.049337345123291014,
382
+ 0.04924415969848633,
383
+ 0.0491960334777832,
384
+ 0.049288192749023435,
385
+ 0.049393665313720705,
386
+ 0.049111038208007815,
387
+ 0.04942233657836914,
388
+ 0.04956671905517578,
389
+ 0.049500160217285157,
390
+ 0.04905062484741211,
391
+ 0.049075199127197267,
392
+ 0.049242111206054685,
393
+ 0.049279998779296875,
394
+ 0.04906291198730469,
395
+ 0.04917964935302734,
396
+ 0.04926054382324219,
397
+ 0.049102848052978515,
398
+ 0.04927590560913086,
399
+ 0.04932223892211914,
400
+ 0.049382144927978516,
401
+ 0.04914585494995117,
402
+ 0.04912025451660156,
403
+ 0.04916633605957031,
404
+ 0.0491253776550293,
405
+ 0.04920012664794922,
406
+ 0.049132545471191405,
407
+ 0.049105918884277344,
408
+ 0.049312767028808595,
409
+ 0.04894617462158203,
410
+ 0.04911718368530273,
411
+ 0.04921036911010742,
412
+ 0.049396736145019535,
413
+ 0.04896051025390625,
414
+ 0.04924518585205078,
415
+ 0.04909363174438477,
416
+ 0.049165313720703124,
417
+ 0.049121280670166016,
418
+ 0.04954521560668945,
419
+ 0.04903219223022461,
420
+ 0.04931071853637695,
421
+ 0.04907417678833008,
422
+ 0.049157119750976565,
423
+ 0.048952320098876956,
424
+ 0.04926873779296875,
425
+ 0.04894617462158203,
426
+ 0.04913663864135742,
427
+ 0.048998401641845706
428
  ]
429
  },
430
  "throughput": {
431
  "unit": "tokens/s",
432
+ "value": 20.257293628787064
433
  },
434
  "energy": null,
435
  "efficiency": null