sauravpanda commited on
Commit
d684f24
·
verified ·
1 Parent(s): e531904

Upload folder using huggingface_hub

Browse files
mlc-chat-config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "version": "0.1.0",
3
  "model_type": "qwen2",
4
- "quantization": "q4f16_1",
5
  "model_config": {
6
  "hidden_act": "silu",
7
  "hidden_size": 1536,
 
1
  {
2
  "version": "0.1.0",
3
  "model_type": "qwen2",
4
+ "quantization": "q4f32_1",
5
  "model_config": {
6
  "hidden_act": "silu",
7
  "hidden_size": 1536,
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "metadata": {
3
  "ParamSize": 313,
4
- "ParamBytes": 999820288.0,
5
- "BitsPerParam": 4.500937659812007
6
  },
7
  "records": [
8
  {
@@ -22,7 +22,7 @@
22
  "byteOffset": 0
23
  }
24
  ],
25
- "md5sum": "f5deae0fcd34d27eab8c21a024c8f711"
26
  },
27
  {
28
  "dataPath": "params_shard_1.bin",
@@ -41,7 +41,7 @@
41
  "byteOffset": 0
42
  }
43
  ],
44
- "md5sum": "accc7a495594768625d8469380130b72"
45
  },
46
  {
47
  "dataPath": "params_shard_2.bin",
@@ -54,7 +54,7 @@
54
  151936,
55
  48
56
  ],
57
- "dtype": "float16",
58
  "format": "f32-to-bf16",
59
  "nbytes": 14585856,
60
  "byteOffset": 0
@@ -65,7 +65,7 @@
65
  151936,
66
  48
67
  ],
68
- "dtype": "float16",
69
  "format": "f32-to-bf16",
70
  "nbytes": 14585856,
71
  "byteOffset": 14585856
@@ -75,13 +75,13 @@
75
  "shape": [
76
  1536
77
  ],
78
- "dtype": "float16",
79
  "format": "f32-to-bf16",
80
  "nbytes": 3072,
81
  "byteOffset": 29171712
82
  }
83
  ],
84
- "md5sum": "ae1dfada404728dce402091f4401ccd4"
85
  },
86
  {
87
  "dataPath": "params_shard_3.bin",
@@ -105,7 +105,7 @@
105
  1536,
106
  280
107
  ],
108
- "dtype": "float16",
109
  "format": "f32-to-bf16",
110
  "nbytes": 860160,
111
  "byteOffset": 6881280
@@ -127,7 +127,7 @@
127
  17920,
128
  48
129
  ],
130
- "dtype": "float16",
131
  "format": "f32-to-bf16",
132
  "nbytes": 1720320,
133
  "byteOffset": 21504000
@@ -137,7 +137,7 @@
137
  "shape": [
138
  1536
139
  ],
140
- "dtype": "float16",
141
  "format": "f32-to-bf16",
142
  "nbytes": 3072,
143
  "byteOffset": 23224320
@@ -147,7 +147,7 @@
147
  "shape": [
148
  2048
149
  ],
150
- "dtype": "float16",
151
  "format": "f32-to-bf16",
152
  "nbytes": 4096,
153
  "byteOffset": 23227392
@@ -169,7 +169,7 @@
169
  2048,
170
  48
171
  ],
172
- "dtype": "float16",
173
  "format": "f32-to-bf16",
174
  "nbytes": 196608,
175
  "byteOffset": 24804352
@@ -191,7 +191,7 @@
191
  1536,
192
  48
193
  ],
194
- "dtype": "float16",
195
  "format": "f32-to-bf16",
196
  "nbytes": 147456,
197
  "byteOffset": 26180608
@@ -201,7 +201,7 @@
201
  "shape": [
202
  1536
203
  ],
204
- "dtype": "float16",
205
  "format": "f32-to-bf16",
206
  "nbytes": 3072,
207
  "byteOffset": 26328064
@@ -218,7 +218,7 @@
218
  "byteOffset": 26331136
219
  }
220
  ],
221
- "md5sum": "1820f3fd356105d481dd8b01eea1915f"
222
  },
223
  {
224
  "dataPath": "params_shard_4.bin",
@@ -231,7 +231,7 @@
231
  1536,
232
  280
233
  ],
234
- "dtype": "float16",
235
  "format": "f32-to-bf16",
236
  "nbytes": 860160,
237
  "byteOffset": 0
@@ -253,7 +253,7 @@
253
  17920,
254
  48
255
  ],
256
- "dtype": "float16",
257
  "format": "f32-to-bf16",
258
  "nbytes": 1720320,
259
  "byteOffset": 14622720
@@ -263,7 +263,7 @@
263
  "shape": [
264
  1536
265
  ],
266
- "dtype": "float16",
267
  "format": "f32-to-bf16",
268
  "nbytes": 3072,
269
  "byteOffset": 16343040
@@ -273,7 +273,7 @@
273
  "shape": [
274
  2048
275
  ],
276
- "dtype": "float16",
277
  "format": "f32-to-bf16",
278
  "nbytes": 4096,
279
  "byteOffset": 16346112
@@ -295,7 +295,7 @@
295
  2048,
296
  48
297
  ],
298
- "dtype": "float16",
299
  "format": "f32-to-bf16",
300
  "nbytes": 196608,
301
  "byteOffset": 17923072
@@ -317,7 +317,7 @@
317
  1536,
318
  48
319
  ],
320
- "dtype": "float16",
321
  "format": "f32-to-bf16",
322
  "nbytes": 147456,
323
  "byteOffset": 19299328
@@ -327,7 +327,7 @@
327
  "shape": [
328
  1536
329
  ],
330
- "dtype": "float16",
331
  "format": "f32-to-bf16",
332
  "nbytes": 3072,
333
  "byteOffset": 19446784
@@ -349,13 +349,13 @@
349
  1536,
350
  280
351
  ],
352
- "dtype": "float16",
353
  "format": "f32-to-bf16",
354
  "nbytes": 860160,
355
  "byteOffset": 26331136
356
  }
357
  ],
358
- "md5sum": "8a33e6af3a9e36d80c960b9f39589377"
359
  },
360
  {
361
  "dataPath": "params_shard_5.bin",
@@ -379,7 +379,7 @@
379
  17920,
380
  48
381
  ],
382
- "dtype": "float16",
383
  "format": "f32-to-bf16",
384
  "nbytes": 1720320,
385
  "byteOffset": 13762560
@@ -389,7 +389,7 @@
389
  "shape": [
390
  1536
391
  ],
392
- "dtype": "float16",
393
  "format": "f32-to-bf16",
394
  "nbytes": 3072,
395
  "byteOffset": 15482880
@@ -399,7 +399,7 @@
399
  "shape": [
400
  2048
401
  ],
402
- "dtype": "float16",
403
  "format": "f32-to-bf16",
404
  "nbytes": 4096,
405
  "byteOffset": 15485952
@@ -421,7 +421,7 @@
421
  2048,
422
  48
423
  ],
424
- "dtype": "float16",
425
  "format": "f32-to-bf16",
426
  "nbytes": 196608,
427
  "byteOffset": 17062912
@@ -443,7 +443,7 @@
443
  1536,
444
  48
445
  ],
446
- "dtype": "float16",
447
  "format": "f32-to-bf16",
448
  "nbytes": 147456,
449
  "byteOffset": 18439168
@@ -453,7 +453,7 @@
453
  "shape": [
454
  1536
455
  ],
456
- "dtype": "float16",
457
  "format": "f32-to-bf16",
458
  "nbytes": 3072,
459
  "byteOffset": 18586624
@@ -475,13 +475,13 @@
475
  1536,
476
  280
477
  ],
478
- "dtype": "float16",
479
  "format": "f32-to-bf16",
480
  "nbytes": 860160,
481
  "byteOffset": 25470976
482
  }
483
  ],
484
- "md5sum": "c1c00d4d1226da4dc6582a63544f0be7"
485
  },
486
  {
487
  "dataPath": "params_shard_6.bin",
@@ -505,7 +505,7 @@
505
  17920,
506
  48
507
  ],
508
- "dtype": "float16",
509
  "format": "f32-to-bf16",
510
  "nbytes": 1720320,
511
  "byteOffset": 13762560
@@ -515,7 +515,7 @@
515
  "shape": [
516
  1536
517
  ],
518
- "dtype": "float16",
519
  "format": "f32-to-bf16",
520
  "nbytes": 3072,
521
  "byteOffset": 15482880
@@ -525,7 +525,7 @@
525
  "shape": [
526
  2048
527
  ],
528
- "dtype": "float16",
529
  "format": "f32-to-bf16",
530
  "nbytes": 4096,
531
  "byteOffset": 15485952
@@ -547,7 +547,7 @@
547
  2048,
548
  48
549
  ],
550
- "dtype": "float16",
551
  "format": "f32-to-bf16",
552
  "nbytes": 196608,
553
  "byteOffset": 17062912
@@ -569,7 +569,7 @@
569
  1536,
570
  48
571
  ],
572
- "dtype": "float16",
573
  "format": "f32-to-bf16",
574
  "nbytes": 147456,
575
  "byteOffset": 18439168
@@ -579,7 +579,7 @@
579
  "shape": [
580
  1536
581
  ],
582
- "dtype": "float16",
583
  "format": "f32-to-bf16",
584
  "nbytes": 3072,
585
  "byteOffset": 18586624
@@ -601,13 +601,13 @@
601
  1536,
602
  280
603
  ],
604
- "dtype": "float16",
605
  "format": "f32-to-bf16",
606
  "nbytes": 860160,
607
  "byteOffset": 25470976
608
  }
609
  ],
610
- "md5sum": "629c77a93182ba528f7f574c27a5041e"
611
  },
612
  {
613
  "dataPath": "params_shard_7.bin",
@@ -631,7 +631,7 @@
631
  17920,
632
  48
633
  ],
634
- "dtype": "float16",
635
  "format": "f32-to-bf16",
636
  "nbytes": 1720320,
637
  "byteOffset": 13762560
@@ -641,7 +641,7 @@
641
  "shape": [
642
  1536
643
  ],
644
- "dtype": "float16",
645
  "format": "f32-to-bf16",
646
  "nbytes": 3072,
647
  "byteOffset": 15482880
@@ -651,7 +651,7 @@
651
  "shape": [
652
  2048
653
  ],
654
- "dtype": "float16",
655
  "format": "f32-to-bf16",
656
  "nbytes": 4096,
657
  "byteOffset": 15485952
@@ -673,7 +673,7 @@
673
  2048,
674
  48
675
  ],
676
- "dtype": "float16",
677
  "format": "f32-to-bf16",
678
  "nbytes": 196608,
679
  "byteOffset": 17062912
@@ -695,7 +695,7 @@
695
  1536,
696
  48
697
  ],
698
- "dtype": "float16",
699
  "format": "f32-to-bf16",
700
  "nbytes": 147456,
701
  "byteOffset": 18439168
@@ -705,7 +705,7 @@
705
  "shape": [
706
  1536
707
  ],
708
- "dtype": "float16",
709
  "format": "f32-to-bf16",
710
  "nbytes": 3072,
711
  "byteOffset": 18586624
@@ -727,13 +727,13 @@
727
  1536,
728
  280
729
  ],
730
- "dtype": "float16",
731
  "format": "f32-to-bf16",
732
  "nbytes": 860160,
733
  "byteOffset": 25470976
734
  }
735
  ],
736
- "md5sum": "e876ced97d9e24ff194706ed53c38285"
737
  },
738
  {
739
  "dataPath": "params_shard_8.bin",
@@ -757,7 +757,7 @@
757
  17920,
758
  48
759
  ],
760
- "dtype": "float16",
761
  "format": "f32-to-bf16",
762
  "nbytes": 1720320,
763
  "byteOffset": 13762560
@@ -767,7 +767,7 @@
767
  "shape": [
768
  1536
769
  ],
770
- "dtype": "float16",
771
  "format": "f32-to-bf16",
772
  "nbytes": 3072,
773
  "byteOffset": 15482880
@@ -777,7 +777,7 @@
777
  "shape": [
778
  2048
779
  ],
780
- "dtype": "float16",
781
  "format": "f32-to-bf16",
782
  "nbytes": 4096,
783
  "byteOffset": 15485952
@@ -799,7 +799,7 @@
799
  2048,
800
  48
801
  ],
802
- "dtype": "float16",
803
  "format": "f32-to-bf16",
804
  "nbytes": 196608,
805
  "byteOffset": 17062912
@@ -821,7 +821,7 @@
821
  1536,
822
  48
823
  ],
824
- "dtype": "float16",
825
  "format": "f32-to-bf16",
826
  "nbytes": 147456,
827
  "byteOffset": 18439168
@@ -831,7 +831,7 @@
831
  "shape": [
832
  1536
833
  ],
834
- "dtype": "float16",
835
  "format": "f32-to-bf16",
836
  "nbytes": 3072,
837
  "byteOffset": 18586624
@@ -853,13 +853,13 @@
853
  1536,
854
  280
855
  ],
856
- "dtype": "float16",
857
  "format": "f32-to-bf16",
858
  "nbytes": 860160,
859
  "byteOffset": 25470976
860
  }
861
  ],
862
- "md5sum": "586c54e5d27ef3e1cbc487be2394f0fa"
863
  },
864
  {
865
  "dataPath": "params_shard_9.bin",
@@ -883,7 +883,7 @@
883
  17920,
884
  48
885
  ],
886
- "dtype": "float16",
887
  "format": "f32-to-bf16",
888
  "nbytes": 1720320,
889
  "byteOffset": 13762560
@@ -893,7 +893,7 @@
893
  "shape": [
894
  1536
895
  ],
896
- "dtype": "float16",
897
  "format": "f32-to-bf16",
898
  "nbytes": 3072,
899
  "byteOffset": 15482880
@@ -903,7 +903,7 @@
903
  "shape": [
904
  2048
905
  ],
906
- "dtype": "float16",
907
  "format": "f32-to-bf16",
908
  "nbytes": 4096,
909
  "byteOffset": 15485952
@@ -925,7 +925,7 @@
925
  2048,
926
  48
927
  ],
928
- "dtype": "float16",
929
  "format": "f32-to-bf16",
930
  "nbytes": 196608,
931
  "byteOffset": 17062912
@@ -947,7 +947,7 @@
947
  1536,
948
  48
949
  ],
950
- "dtype": "float16",
951
  "format": "f32-to-bf16",
952
  "nbytes": 147456,
953
  "byteOffset": 18439168
@@ -957,7 +957,7 @@
957
  "shape": [
958
  1536
959
  ],
960
- "dtype": "float16",
961
  "format": "f32-to-bf16",
962
  "nbytes": 3072,
963
  "byteOffset": 18586624
@@ -979,13 +979,13 @@
979
  1536,
980
  280
981
  ],
982
- "dtype": "float16",
983
  "format": "f32-to-bf16",
984
  "nbytes": 860160,
985
  "byteOffset": 25470976
986
  }
987
  ],
988
- "md5sum": "433c3d6ba4414e15f1ff7887f6f7a6dc"
989
  },
990
  {
991
  "dataPath": "params_shard_10.bin",
@@ -1009,7 +1009,7 @@
1009
  17920,
1010
  48
1011
  ],
1012
- "dtype": "float16",
1013
  "format": "f32-to-bf16",
1014
  "nbytes": 1720320,
1015
  "byteOffset": 13762560
@@ -1019,7 +1019,7 @@
1019
  "shape": [
1020
  1536
1021
  ],
1022
- "dtype": "float16",
1023
  "format": "f32-to-bf16",
1024
  "nbytes": 3072,
1025
  "byteOffset": 15482880
@@ -1029,7 +1029,7 @@
1029
  "shape": [
1030
  2048
1031
  ],
1032
- "dtype": "float16",
1033
  "format": "f32-to-bf16",
1034
  "nbytes": 4096,
1035
  "byteOffset": 15485952
@@ -1051,7 +1051,7 @@
1051
  2048,
1052
  48
1053
  ],
1054
- "dtype": "float16",
1055
  "format": "f32-to-bf16",
1056
  "nbytes": 196608,
1057
  "byteOffset": 17062912
@@ -1073,7 +1073,7 @@
1073
  1536,
1074
  48
1075
  ],
1076
- "dtype": "float16",
1077
  "format": "f32-to-bf16",
1078
  "nbytes": 147456,
1079
  "byteOffset": 18439168
@@ -1083,7 +1083,7 @@
1083
  "shape": [
1084
  1536
1085
  ],
1086
- "dtype": "float16",
1087
  "format": "f32-to-bf16",
1088
  "nbytes": 3072,
1089
  "byteOffset": 18586624
@@ -1105,13 +1105,13 @@
1105
  1536,
1106
  280
1107
  ],
1108
- "dtype": "float16",
1109
  "format": "f32-to-bf16",
1110
  "nbytes": 860160,
1111
  "byteOffset": 25470976
1112
  }
1113
  ],
1114
- "md5sum": "5a34b349cdad1743ac9c04a6789318c5"
1115
  },
1116
  {
1117
  "dataPath": "params_shard_11.bin",
@@ -1135,7 +1135,7 @@
1135
  17920,
1136
  48
1137
  ],
1138
- "dtype": "float16",
1139
  "format": "f32-to-bf16",
1140
  "nbytes": 1720320,
1141
  "byteOffset": 13762560
@@ -1145,7 +1145,7 @@
1145
  "shape": [
1146
  1536
1147
  ],
1148
- "dtype": "float16",
1149
  "format": "f32-to-bf16",
1150
  "nbytes": 3072,
1151
  "byteOffset": 15482880
@@ -1155,7 +1155,7 @@
1155
  "shape": [
1156
  2048
1157
  ],
1158
- "dtype": "float16",
1159
  "format": "f32-to-bf16",
1160
  "nbytes": 4096,
1161
  "byteOffset": 15485952
@@ -1177,7 +1177,7 @@
1177
  2048,
1178
  48
1179
  ],
1180
- "dtype": "float16",
1181
  "format": "f32-to-bf16",
1182
  "nbytes": 196608,
1183
  "byteOffset": 17062912
@@ -1199,7 +1199,7 @@
1199
  1536,
1200
  48
1201
  ],
1202
- "dtype": "float16",
1203
  "format": "f32-to-bf16",
1204
  "nbytes": 147456,
1205
  "byteOffset": 18439168
@@ -1209,7 +1209,7 @@
1209
  "shape": [
1210
  1536
1211
  ],
1212
- "dtype": "float16",
1213
  "format": "f32-to-bf16",
1214
  "nbytes": 3072,
1215
  "byteOffset": 18586624
@@ -1231,13 +1231,13 @@
1231
  1536,
1232
  280
1233
  ],
1234
- "dtype": "float16",
1235
  "format": "f32-to-bf16",
1236
  "nbytes": 860160,
1237
  "byteOffset": 25470976
1238
  }
1239
  ],
1240
- "md5sum": "213b770ec9caae8a16b988edac1052c9"
1241
  },
1242
  {
1243
  "dataPath": "params_shard_12.bin",
@@ -1261,7 +1261,7 @@
1261
  17920,
1262
  48
1263
  ],
1264
- "dtype": "float16",
1265
  "format": "f32-to-bf16",
1266
  "nbytes": 1720320,
1267
  "byteOffset": 13762560
@@ -1271,7 +1271,7 @@
1271
  "shape": [
1272
  1536
1273
  ],
1274
- "dtype": "float16",
1275
  "format": "f32-to-bf16",
1276
  "nbytes": 3072,
1277
  "byteOffset": 15482880
@@ -1281,7 +1281,7 @@
1281
  "shape": [
1282
  2048
1283
  ],
1284
- "dtype": "float16",
1285
  "format": "f32-to-bf16",
1286
  "nbytes": 4096,
1287
  "byteOffset": 15485952
@@ -1303,7 +1303,7 @@
1303
  2048,
1304
  48
1305
  ],
1306
- "dtype": "float16",
1307
  "format": "f32-to-bf16",
1308
  "nbytes": 196608,
1309
  "byteOffset": 17062912
@@ -1325,7 +1325,7 @@
1325
  1536,
1326
  48
1327
  ],
1328
- "dtype": "float16",
1329
  "format": "f32-to-bf16",
1330
  "nbytes": 147456,
1331
  "byteOffset": 18439168
@@ -1335,7 +1335,7 @@
1335
  "shape": [
1336
  1536
1337
  ],
1338
- "dtype": "float16",
1339
  "format": "f32-to-bf16",
1340
  "nbytes": 3072,
1341
  "byteOffset": 18586624
@@ -1357,13 +1357,13 @@
1357
  1536,
1358
  280
1359
  ],
1360
- "dtype": "float16",
1361
  "format": "f32-to-bf16",
1362
  "nbytes": 860160,
1363
  "byteOffset": 25470976
1364
  }
1365
  ],
1366
- "md5sum": "1060d21c45674e009aa882fdfa733e97"
1367
  },
1368
  {
1369
  "dataPath": "params_shard_13.bin",
@@ -1387,7 +1387,7 @@
1387
  17920,
1388
  48
1389
  ],
1390
- "dtype": "float16",
1391
  "format": "f32-to-bf16",
1392
  "nbytes": 1720320,
1393
  "byteOffset": 13762560
@@ -1397,7 +1397,7 @@
1397
  "shape": [
1398
  1536
1399
  ],
1400
- "dtype": "float16",
1401
  "format": "f32-to-bf16",
1402
  "nbytes": 3072,
1403
  "byteOffset": 15482880
@@ -1407,7 +1407,7 @@
1407
  "shape": [
1408
  2048
1409
  ],
1410
- "dtype": "float16",
1411
  "format": "f32-to-bf16",
1412
  "nbytes": 4096,
1413
  "byteOffset": 15485952
@@ -1429,7 +1429,7 @@
1429
  2048,
1430
  48
1431
  ],
1432
- "dtype": "float16",
1433
  "format": "f32-to-bf16",
1434
  "nbytes": 196608,
1435
  "byteOffset": 17062912
@@ -1451,7 +1451,7 @@
1451
  1536,
1452
  48
1453
  ],
1454
- "dtype": "float16",
1455
  "format": "f32-to-bf16",
1456
  "nbytes": 147456,
1457
  "byteOffset": 18439168
@@ -1461,7 +1461,7 @@
1461
  "shape": [
1462
  1536
1463
  ],
1464
- "dtype": "float16",
1465
  "format": "f32-to-bf16",
1466
  "nbytes": 3072,
1467
  "byteOffset": 18586624
@@ -1483,13 +1483,13 @@
1483
  1536,
1484
  280
1485
  ],
1486
- "dtype": "float16",
1487
  "format": "f32-to-bf16",
1488
  "nbytes": 860160,
1489
  "byteOffset": 25470976
1490
  }
1491
  ],
1492
- "md5sum": "909cc35a4c07aab9afeb35a1c234a94b"
1493
  },
1494
  {
1495
  "dataPath": "params_shard_14.bin",
@@ -1513,7 +1513,7 @@
1513
  17920,
1514
  48
1515
  ],
1516
- "dtype": "float16",
1517
  "format": "f32-to-bf16",
1518
  "nbytes": 1720320,
1519
  "byteOffset": 13762560
@@ -1523,7 +1523,7 @@
1523
  "shape": [
1524
  1536
1525
  ],
1526
- "dtype": "float16",
1527
  "format": "f32-to-bf16",
1528
  "nbytes": 3072,
1529
  "byteOffset": 15482880
@@ -1533,7 +1533,7 @@
1533
  "shape": [
1534
  2048
1535
  ],
1536
- "dtype": "float16",
1537
  "format": "f32-to-bf16",
1538
  "nbytes": 4096,
1539
  "byteOffset": 15485952
@@ -1555,7 +1555,7 @@
1555
  2048,
1556
  48
1557
  ],
1558
- "dtype": "float16",
1559
  "format": "f32-to-bf16",
1560
  "nbytes": 196608,
1561
  "byteOffset": 17062912
@@ -1577,7 +1577,7 @@
1577
  1536,
1578
  48
1579
  ],
1580
- "dtype": "float16",
1581
  "format": "f32-to-bf16",
1582
  "nbytes": 147456,
1583
  "byteOffset": 18439168
@@ -1587,7 +1587,7 @@
1587
  "shape": [
1588
  1536
1589
  ],
1590
- "dtype": "float16",
1591
  "format": "f32-to-bf16",
1592
  "nbytes": 3072,
1593
  "byteOffset": 18586624
@@ -1609,13 +1609,13 @@
1609
  1536,
1610
  280
1611
  ],
1612
- "dtype": "float16",
1613
  "format": "f32-to-bf16",
1614
  "nbytes": 860160,
1615
  "byteOffset": 25470976
1616
  }
1617
  ],
1618
- "md5sum": "87be97d87ef2698d37068226731c3994"
1619
  },
1620
  {
1621
  "dataPath": "params_shard_15.bin",
@@ -1639,7 +1639,7 @@
1639
  17920,
1640
  48
1641
  ],
1642
- "dtype": "float16",
1643
  "format": "f32-to-bf16",
1644
  "nbytes": 1720320,
1645
  "byteOffset": 13762560
@@ -1649,7 +1649,7 @@
1649
  "shape": [
1650
  1536
1651
  ],
1652
- "dtype": "float16",
1653
  "format": "f32-to-bf16",
1654
  "nbytes": 3072,
1655
  "byteOffset": 15482880
@@ -1659,7 +1659,7 @@
1659
  "shape": [
1660
  2048
1661
  ],
1662
- "dtype": "float16",
1663
  "format": "f32-to-bf16",
1664
  "nbytes": 4096,
1665
  "byteOffset": 15485952
@@ -1681,7 +1681,7 @@
1681
  2048,
1682
  48
1683
  ],
1684
- "dtype": "float16",
1685
  "format": "f32-to-bf16",
1686
  "nbytes": 196608,
1687
  "byteOffset": 17062912
@@ -1703,7 +1703,7 @@
1703
  1536,
1704
  48
1705
  ],
1706
- "dtype": "float16",
1707
  "format": "f32-to-bf16",
1708
  "nbytes": 147456,
1709
  "byteOffset": 18439168
@@ -1713,7 +1713,7 @@
1713
  "shape": [
1714
  1536
1715
  ],
1716
- "dtype": "float16",
1717
  "format": "f32-to-bf16",
1718
  "nbytes": 3072,
1719
  "byteOffset": 18586624
@@ -1735,13 +1735,13 @@
1735
  1536,
1736
  280
1737
  ],
1738
- "dtype": "float16",
1739
  "format": "f32-to-bf16",
1740
  "nbytes": 860160,
1741
  "byteOffset": 25470976
1742
  }
1743
  ],
1744
- "md5sum": "71f068ccd14d34ece134254f1526a3d2"
1745
  },
1746
  {
1747
  "dataPath": "params_shard_16.bin",
@@ -1765,7 +1765,7 @@
1765
  17920,
1766
  48
1767
  ],
1768
- "dtype": "float16",
1769
  "format": "f32-to-bf16",
1770
  "nbytes": 1720320,
1771
  "byteOffset": 13762560
@@ -1775,7 +1775,7 @@
1775
  "shape": [
1776
  1536
1777
  ],
1778
- "dtype": "float16",
1779
  "format": "f32-to-bf16",
1780
  "nbytes": 3072,
1781
  "byteOffset": 15482880
@@ -1785,7 +1785,7 @@
1785
  "shape": [
1786
  2048
1787
  ],
1788
- "dtype": "float16",
1789
  "format": "f32-to-bf16",
1790
  "nbytes": 4096,
1791
  "byteOffset": 15485952
@@ -1807,7 +1807,7 @@
1807
  2048,
1808
  48
1809
  ],
1810
- "dtype": "float16",
1811
  "format": "f32-to-bf16",
1812
  "nbytes": 196608,
1813
  "byteOffset": 17062912
@@ -1829,7 +1829,7 @@
1829
  1536,
1830
  48
1831
  ],
1832
- "dtype": "float16",
1833
  "format": "f32-to-bf16",
1834
  "nbytes": 147456,
1835
  "byteOffset": 18439168
@@ -1839,7 +1839,7 @@
1839
  "shape": [
1840
  1536
1841
  ],
1842
- "dtype": "float16",
1843
  "format": "f32-to-bf16",
1844
  "nbytes": 3072,
1845
  "byteOffset": 18586624
@@ -1861,13 +1861,13 @@
1861
  1536,
1862
  280
1863
  ],
1864
- "dtype": "float16",
1865
  "format": "f32-to-bf16",
1866
  "nbytes": 860160,
1867
  "byteOffset": 25470976
1868
  }
1869
  ],
1870
- "md5sum": "813b3227b3a80948174130d6df4d2cf5"
1871
  },
1872
  {
1873
  "dataPath": "params_shard_17.bin",
@@ -1891,7 +1891,7 @@
1891
  17920,
1892
  48
1893
  ],
1894
- "dtype": "float16",
1895
  "format": "f32-to-bf16",
1896
  "nbytes": 1720320,
1897
  "byteOffset": 13762560
@@ -1901,7 +1901,7 @@
1901
  "shape": [
1902
  1536
1903
  ],
1904
- "dtype": "float16",
1905
  "format": "f32-to-bf16",
1906
  "nbytes": 3072,
1907
  "byteOffset": 15482880
@@ -1911,7 +1911,7 @@
1911
  "shape": [
1912
  2048
1913
  ],
1914
- "dtype": "float16",
1915
  "format": "f32-to-bf16",
1916
  "nbytes": 4096,
1917
  "byteOffset": 15485952
@@ -1933,7 +1933,7 @@
1933
  2048,
1934
  48
1935
  ],
1936
- "dtype": "float16",
1937
  "format": "f32-to-bf16",
1938
  "nbytes": 196608,
1939
  "byteOffset": 17062912
@@ -1955,7 +1955,7 @@
1955
  1536,
1956
  48
1957
  ],
1958
- "dtype": "float16",
1959
  "format": "f32-to-bf16",
1960
  "nbytes": 147456,
1961
  "byteOffset": 18439168
@@ -1965,7 +1965,7 @@
1965
  "shape": [
1966
  1536
1967
  ],
1968
- "dtype": "float16",
1969
  "format": "f32-to-bf16",
1970
  "nbytes": 3072,
1971
  "byteOffset": 18586624
@@ -1987,13 +1987,13 @@
1987
  1536,
1988
  280
1989
  ],
1990
- "dtype": "float16",
1991
  "format": "f32-to-bf16",
1992
  "nbytes": 860160,
1993
  "byteOffset": 25470976
1994
  }
1995
  ],
1996
- "md5sum": "52d232883cc6c86ed14d4bef6d5589eb"
1997
  },
1998
  {
1999
  "dataPath": "params_shard_18.bin",
@@ -2017,7 +2017,7 @@
2017
  17920,
2018
  48
2019
  ],
2020
- "dtype": "float16",
2021
  "format": "f32-to-bf16",
2022
  "nbytes": 1720320,
2023
  "byteOffset": 13762560
@@ -2027,7 +2027,7 @@
2027
  "shape": [
2028
  1536
2029
  ],
2030
- "dtype": "float16",
2031
  "format": "f32-to-bf16",
2032
  "nbytes": 3072,
2033
  "byteOffset": 15482880
@@ -2037,7 +2037,7 @@
2037
  "shape": [
2038
  2048
2039
  ],
2040
- "dtype": "float16",
2041
  "format": "f32-to-bf16",
2042
  "nbytes": 4096,
2043
  "byteOffset": 15485952
@@ -2059,7 +2059,7 @@
2059
  2048,
2060
  48
2061
  ],
2062
- "dtype": "float16",
2063
  "format": "f32-to-bf16",
2064
  "nbytes": 196608,
2065
  "byteOffset": 17062912
@@ -2081,7 +2081,7 @@
2081
  1536,
2082
  48
2083
  ],
2084
- "dtype": "float16",
2085
  "format": "f32-to-bf16",
2086
  "nbytes": 147456,
2087
  "byteOffset": 18439168
@@ -2091,7 +2091,7 @@
2091
  "shape": [
2092
  1536
2093
  ],
2094
- "dtype": "float16",
2095
  "format": "f32-to-bf16",
2096
  "nbytes": 3072,
2097
  "byteOffset": 18586624
@@ -2113,13 +2113,13 @@
2113
  1536,
2114
  280
2115
  ],
2116
- "dtype": "float16",
2117
  "format": "f32-to-bf16",
2118
  "nbytes": 860160,
2119
  "byteOffset": 25470976
2120
  }
2121
  ],
2122
- "md5sum": "58f131fa9e510407fc7b0a97c21553da"
2123
  },
2124
  {
2125
  "dataPath": "params_shard_19.bin",
@@ -2143,7 +2143,7 @@
2143
  17920,
2144
  48
2145
  ],
2146
- "dtype": "float16",
2147
  "format": "f32-to-bf16",
2148
  "nbytes": 1720320,
2149
  "byteOffset": 13762560
@@ -2153,7 +2153,7 @@
2153
  "shape": [
2154
  1536
2155
  ],
2156
- "dtype": "float16",
2157
  "format": "f32-to-bf16",
2158
  "nbytes": 3072,
2159
  "byteOffset": 15482880
@@ -2163,7 +2163,7 @@
2163
  "shape": [
2164
  2048
2165
  ],
2166
- "dtype": "float16",
2167
  "format": "f32-to-bf16",
2168
  "nbytes": 4096,
2169
  "byteOffset": 15485952
@@ -2185,7 +2185,7 @@
2185
  2048,
2186
  48
2187
  ],
2188
- "dtype": "float16",
2189
  "format": "f32-to-bf16",
2190
  "nbytes": 196608,
2191
  "byteOffset": 17062912
@@ -2207,7 +2207,7 @@
2207
  1536,
2208
  48
2209
  ],
2210
- "dtype": "float16",
2211
  "format": "f32-to-bf16",
2212
  "nbytes": 147456,
2213
  "byteOffset": 18439168
@@ -2217,7 +2217,7 @@
2217
  "shape": [
2218
  1536
2219
  ],
2220
- "dtype": "float16",
2221
  "format": "f32-to-bf16",
2222
  "nbytes": 3072,
2223
  "byteOffset": 18586624
@@ -2239,13 +2239,13 @@
2239
  1536,
2240
  280
2241
  ],
2242
- "dtype": "float16",
2243
  "format": "f32-to-bf16",
2244
  "nbytes": 860160,
2245
  "byteOffset": 25470976
2246
  }
2247
  ],
2248
- "md5sum": "3db48f9483ae44df502d9e82f00195b3"
2249
  },
2250
  {
2251
  "dataPath": "params_shard_20.bin",
@@ -2269,7 +2269,7 @@
2269
  17920,
2270
  48
2271
  ],
2272
- "dtype": "float16",
2273
  "format": "f32-to-bf16",
2274
  "nbytes": 1720320,
2275
  "byteOffset": 13762560
@@ -2279,7 +2279,7 @@
2279
  "shape": [
2280
  1536
2281
  ],
2282
- "dtype": "float16",
2283
  "format": "f32-to-bf16",
2284
  "nbytes": 3072,
2285
  "byteOffset": 15482880
@@ -2289,7 +2289,7 @@
2289
  "shape": [
2290
  2048
2291
  ],
2292
- "dtype": "float16",
2293
  "format": "f32-to-bf16",
2294
  "nbytes": 4096,
2295
  "byteOffset": 15485952
@@ -2311,7 +2311,7 @@
2311
  2048,
2312
  48
2313
  ],
2314
- "dtype": "float16",
2315
  "format": "f32-to-bf16",
2316
  "nbytes": 196608,
2317
  "byteOffset": 17062912
@@ -2333,7 +2333,7 @@
2333
  1536,
2334
  48
2335
  ],
2336
- "dtype": "float16",
2337
  "format": "f32-to-bf16",
2338
  "nbytes": 147456,
2339
  "byteOffset": 18439168
@@ -2343,7 +2343,7 @@
2343
  "shape": [
2344
  1536
2345
  ],
2346
- "dtype": "float16",
2347
  "format": "f32-to-bf16",
2348
  "nbytes": 3072,
2349
  "byteOffset": 18586624
@@ -2365,13 +2365,13 @@
2365
  1536,
2366
  280
2367
  ],
2368
- "dtype": "float16",
2369
  "format": "f32-to-bf16",
2370
  "nbytes": 860160,
2371
  "byteOffset": 25470976
2372
  }
2373
  ],
2374
- "md5sum": "f424198c22c3891fa09298641c764185"
2375
  },
2376
  {
2377
  "dataPath": "params_shard_21.bin",
@@ -2395,7 +2395,7 @@
2395
  17920,
2396
  48
2397
  ],
2398
- "dtype": "float16",
2399
  "format": "f32-to-bf16",
2400
  "nbytes": 1720320,
2401
  "byteOffset": 13762560
@@ -2405,7 +2405,7 @@
2405
  "shape": [
2406
  1536
2407
  ],
2408
- "dtype": "float16",
2409
  "format": "f32-to-bf16",
2410
  "nbytes": 3072,
2411
  "byteOffset": 15482880
@@ -2415,7 +2415,7 @@
2415
  "shape": [
2416
  2048
2417
  ],
2418
- "dtype": "float16",
2419
  "format": "f32-to-bf16",
2420
  "nbytes": 4096,
2421
  "byteOffset": 15485952
@@ -2437,7 +2437,7 @@
2437
  2048,
2438
  48
2439
  ],
2440
- "dtype": "float16",
2441
  "format": "f32-to-bf16",
2442
  "nbytes": 196608,
2443
  "byteOffset": 17062912
@@ -2459,7 +2459,7 @@
2459
  1536,
2460
  48
2461
  ],
2462
- "dtype": "float16",
2463
  "format": "f32-to-bf16",
2464
  "nbytes": 147456,
2465
  "byteOffset": 18439168
@@ -2469,7 +2469,7 @@
2469
  "shape": [
2470
  1536
2471
  ],
2472
- "dtype": "float16",
2473
  "format": "f32-to-bf16",
2474
  "nbytes": 3072,
2475
  "byteOffset": 18586624
@@ -2491,13 +2491,13 @@
2491
  1536,
2492
  280
2493
  ],
2494
- "dtype": "float16",
2495
  "format": "f32-to-bf16",
2496
  "nbytes": 860160,
2497
  "byteOffset": 25470976
2498
  }
2499
  ],
2500
- "md5sum": "07dab1c18a55c464ef6b21c36f00bc64"
2501
  },
2502
  {
2503
  "dataPath": "params_shard_22.bin",
@@ -2521,7 +2521,7 @@
2521
  17920,
2522
  48
2523
  ],
2524
- "dtype": "float16",
2525
  "format": "f32-to-bf16",
2526
  "nbytes": 1720320,
2527
  "byteOffset": 13762560
@@ -2531,7 +2531,7 @@
2531
  "shape": [
2532
  1536
2533
  ],
2534
- "dtype": "float16",
2535
  "format": "f32-to-bf16",
2536
  "nbytes": 3072,
2537
  "byteOffset": 15482880
@@ -2541,7 +2541,7 @@
2541
  "shape": [
2542
  2048
2543
  ],
2544
- "dtype": "float16",
2545
  "format": "f32-to-bf16",
2546
  "nbytes": 4096,
2547
  "byteOffset": 15485952
@@ -2563,7 +2563,7 @@
2563
  2048,
2564
  48
2565
  ],
2566
- "dtype": "float16",
2567
  "format": "f32-to-bf16",
2568
  "nbytes": 196608,
2569
  "byteOffset": 17062912
@@ -2585,7 +2585,7 @@
2585
  1536,
2586
  48
2587
  ],
2588
- "dtype": "float16",
2589
  "format": "f32-to-bf16",
2590
  "nbytes": 147456,
2591
  "byteOffset": 18439168
@@ -2595,7 +2595,7 @@
2595
  "shape": [
2596
  1536
2597
  ],
2598
- "dtype": "float16",
2599
  "format": "f32-to-bf16",
2600
  "nbytes": 3072,
2601
  "byteOffset": 18586624
@@ -2617,13 +2617,13 @@
2617
  1536,
2618
  280
2619
  ],
2620
- "dtype": "float16",
2621
  "format": "f32-to-bf16",
2622
  "nbytes": 860160,
2623
  "byteOffset": 25470976
2624
  }
2625
  ],
2626
- "md5sum": "44c0bf0e631e366ba490b6ea9c548bef"
2627
  },
2628
  {
2629
  "dataPath": "params_shard_23.bin",
@@ -2647,7 +2647,7 @@
2647
  17920,
2648
  48
2649
  ],
2650
- "dtype": "float16",
2651
  "format": "f32-to-bf16",
2652
  "nbytes": 1720320,
2653
  "byteOffset": 13762560
@@ -2657,7 +2657,7 @@
2657
  "shape": [
2658
  1536
2659
  ],
2660
- "dtype": "float16",
2661
  "format": "f32-to-bf16",
2662
  "nbytes": 3072,
2663
  "byteOffset": 15482880
@@ -2667,7 +2667,7 @@
2667
  "shape": [
2668
  2048
2669
  ],
2670
- "dtype": "float16",
2671
  "format": "f32-to-bf16",
2672
  "nbytes": 4096,
2673
  "byteOffset": 15485952
@@ -2689,7 +2689,7 @@
2689
  2048,
2690
  48
2691
  ],
2692
- "dtype": "float16",
2693
  "format": "f32-to-bf16",
2694
  "nbytes": 196608,
2695
  "byteOffset": 17062912
@@ -2711,7 +2711,7 @@
2711
  1536,
2712
  48
2713
  ],
2714
- "dtype": "float16",
2715
  "format": "f32-to-bf16",
2716
  "nbytes": 147456,
2717
  "byteOffset": 18439168
@@ -2721,7 +2721,7 @@
2721
  "shape": [
2722
  1536
2723
  ],
2724
- "dtype": "float16",
2725
  "format": "f32-to-bf16",
2726
  "nbytes": 3072,
2727
  "byteOffset": 18586624
@@ -2743,13 +2743,13 @@
2743
  1536,
2744
  280
2745
  ],
2746
- "dtype": "float16",
2747
  "format": "f32-to-bf16",
2748
  "nbytes": 860160,
2749
  "byteOffset": 25470976
2750
  }
2751
  ],
2752
- "md5sum": "dfd5f83222f16e21e6d52fbf1fd7b000"
2753
  },
2754
  {
2755
  "dataPath": "params_shard_24.bin",
@@ -2773,7 +2773,7 @@
2773
  17920,
2774
  48
2775
  ],
2776
- "dtype": "float16",
2777
  "format": "f32-to-bf16",
2778
  "nbytes": 1720320,
2779
  "byteOffset": 13762560
@@ -2783,7 +2783,7 @@
2783
  "shape": [
2784
  1536
2785
  ],
2786
- "dtype": "float16",
2787
  "format": "f32-to-bf16",
2788
  "nbytes": 3072,
2789
  "byteOffset": 15482880
@@ -2793,7 +2793,7 @@
2793
  "shape": [
2794
  2048
2795
  ],
2796
- "dtype": "float16",
2797
  "format": "f32-to-bf16",
2798
  "nbytes": 4096,
2799
  "byteOffset": 15485952
@@ -2815,7 +2815,7 @@
2815
  2048,
2816
  48
2817
  ],
2818
- "dtype": "float16",
2819
  "format": "f32-to-bf16",
2820
  "nbytes": 196608,
2821
  "byteOffset": 17062912
@@ -2837,7 +2837,7 @@
2837
  1536,
2838
  48
2839
  ],
2840
- "dtype": "float16",
2841
  "format": "f32-to-bf16",
2842
  "nbytes": 147456,
2843
  "byteOffset": 18439168
@@ -2847,7 +2847,7 @@
2847
  "shape": [
2848
  1536
2849
  ],
2850
- "dtype": "float16",
2851
  "format": "f32-to-bf16",
2852
  "nbytes": 3072,
2853
  "byteOffset": 18586624
@@ -2869,13 +2869,13 @@
2869
  1536,
2870
  280
2871
  ],
2872
- "dtype": "float16",
2873
  "format": "f32-to-bf16",
2874
  "nbytes": 860160,
2875
  "byteOffset": 25470976
2876
  }
2877
  ],
2878
- "md5sum": "84afd98a1578859faf792451e46cb8af"
2879
  },
2880
  {
2881
  "dataPath": "params_shard_25.bin",
@@ -2899,7 +2899,7 @@
2899
  17920,
2900
  48
2901
  ],
2902
- "dtype": "float16",
2903
  "format": "f32-to-bf16",
2904
  "nbytes": 1720320,
2905
  "byteOffset": 13762560
@@ -2909,7 +2909,7 @@
2909
  "shape": [
2910
  1536
2911
  ],
2912
- "dtype": "float16",
2913
  "format": "f32-to-bf16",
2914
  "nbytes": 3072,
2915
  "byteOffset": 15482880
@@ -2919,7 +2919,7 @@
2919
  "shape": [
2920
  2048
2921
  ],
2922
- "dtype": "float16",
2923
  "format": "f32-to-bf16",
2924
  "nbytes": 4096,
2925
  "byteOffset": 15485952
@@ -2941,7 +2941,7 @@
2941
  2048,
2942
  48
2943
  ],
2944
- "dtype": "float16",
2945
  "format": "f32-to-bf16",
2946
  "nbytes": 196608,
2947
  "byteOffset": 17062912
@@ -2963,7 +2963,7 @@
2963
  1536,
2964
  48
2965
  ],
2966
- "dtype": "float16",
2967
  "format": "f32-to-bf16",
2968
  "nbytes": 147456,
2969
  "byteOffset": 18439168
@@ -2973,7 +2973,7 @@
2973
  "shape": [
2974
  1536
2975
  ],
2976
- "dtype": "float16",
2977
  "format": "f32-to-bf16",
2978
  "nbytes": 3072,
2979
  "byteOffset": 18586624
@@ -2995,13 +2995,13 @@
2995
  1536,
2996
  280
2997
  ],
2998
- "dtype": "float16",
2999
  "format": "f32-to-bf16",
3000
  "nbytes": 860160,
3001
  "byteOffset": 25470976
3002
  }
3003
  ],
3004
- "md5sum": "e80fb8e1b3c747052052742c76b1062d"
3005
  },
3006
  {
3007
  "dataPath": "params_shard_26.bin",
@@ -3025,7 +3025,7 @@
3025
  17920,
3026
  48
3027
  ],
3028
- "dtype": "float16",
3029
  "format": "f32-to-bf16",
3030
  "nbytes": 1720320,
3031
  "byteOffset": 13762560
@@ -3035,7 +3035,7 @@
3035
  "shape": [
3036
  1536
3037
  ],
3038
- "dtype": "float16",
3039
  "format": "f32-to-bf16",
3040
  "nbytes": 3072,
3041
  "byteOffset": 15482880
@@ -3045,7 +3045,7 @@
3045
  "shape": [
3046
  2048
3047
  ],
3048
- "dtype": "float16",
3049
  "format": "f32-to-bf16",
3050
  "nbytes": 4096,
3051
  "byteOffset": 15485952
@@ -3067,7 +3067,7 @@
3067
  2048,
3068
  48
3069
  ],
3070
- "dtype": "float16",
3071
  "format": "f32-to-bf16",
3072
  "nbytes": 196608,
3073
  "byteOffset": 17062912
@@ -3089,7 +3089,7 @@
3089
  1536,
3090
  48
3091
  ],
3092
- "dtype": "float16",
3093
  "format": "f32-to-bf16",
3094
  "nbytes": 147456,
3095
  "byteOffset": 18439168
@@ -3099,7 +3099,7 @@
3099
  "shape": [
3100
  1536
3101
  ],
3102
- "dtype": "float16",
3103
  "format": "f32-to-bf16",
3104
  "nbytes": 3072,
3105
  "byteOffset": 18586624
@@ -3121,13 +3121,13 @@
3121
  1536,
3122
  280
3123
  ],
3124
- "dtype": "float16",
3125
  "format": "f32-to-bf16",
3126
  "nbytes": 860160,
3127
  "byteOffset": 25470976
3128
  }
3129
  ],
3130
- "md5sum": "99d116b46fdb2df517ad5e6ba222ae51"
3131
  },
3132
  {
3133
  "dataPath": "params_shard_27.bin",
@@ -3151,7 +3151,7 @@
3151
  17920,
3152
  48
3153
  ],
3154
- "dtype": "float16",
3155
  "format": "f32-to-bf16",
3156
  "nbytes": 1720320,
3157
  "byteOffset": 13762560
@@ -3161,7 +3161,7 @@
3161
  "shape": [
3162
  1536
3163
  ],
3164
- "dtype": "float16",
3165
  "format": "f32-to-bf16",
3166
  "nbytes": 3072,
3167
  "byteOffset": 15482880
@@ -3171,7 +3171,7 @@
3171
  "shape": [
3172
  2048
3173
  ],
3174
- "dtype": "float16",
3175
  "format": "f32-to-bf16",
3176
  "nbytes": 4096,
3177
  "byteOffset": 15485952
@@ -3193,7 +3193,7 @@
3193
  2048,
3194
  48
3195
  ],
3196
- "dtype": "float16",
3197
  "format": "f32-to-bf16",
3198
  "nbytes": 196608,
3199
  "byteOffset": 17062912
@@ -3215,7 +3215,7 @@
3215
  1536,
3216
  48
3217
  ],
3218
- "dtype": "float16",
3219
  "format": "f32-to-bf16",
3220
  "nbytes": 147456,
3221
  "byteOffset": 18439168
@@ -3225,7 +3225,7 @@
3225
  "shape": [
3226
  1536
3227
  ],
3228
- "dtype": "float16",
3229
  "format": "f32-to-bf16",
3230
  "nbytes": 3072,
3231
  "byteOffset": 18586624
@@ -3247,13 +3247,13 @@
3247
  1536,
3248
  280
3249
  ],
3250
- "dtype": "float16",
3251
  "format": "f32-to-bf16",
3252
  "nbytes": 860160,
3253
  "byteOffset": 25470976
3254
  }
3255
  ],
3256
- "md5sum": "6e72108d5d3e46b06a1caae71c7f36a9"
3257
  },
3258
  {
3259
  "dataPath": "params_shard_28.bin",
@@ -3277,7 +3277,7 @@
3277
  17920,
3278
  48
3279
  ],
3280
- "dtype": "float16",
3281
  "format": "f32-to-bf16",
3282
  "nbytes": 1720320,
3283
  "byteOffset": 13762560
@@ -3287,7 +3287,7 @@
3287
  "shape": [
3288
  1536
3289
  ],
3290
- "dtype": "float16",
3291
  "format": "f32-to-bf16",
3292
  "nbytes": 3072,
3293
  "byteOffset": 15482880
@@ -3297,7 +3297,7 @@
3297
  "shape": [
3298
  2048
3299
  ],
3300
- "dtype": "float16",
3301
  "format": "f32-to-bf16",
3302
  "nbytes": 4096,
3303
  "byteOffset": 15485952
@@ -3319,7 +3319,7 @@
3319
  2048,
3320
  48
3321
  ],
3322
- "dtype": "float16",
3323
  "format": "f32-to-bf16",
3324
  "nbytes": 196608,
3325
  "byteOffset": 17062912
@@ -3341,7 +3341,7 @@
3341
  1536,
3342
  48
3343
  ],
3344
- "dtype": "float16",
3345
  "format": "f32-to-bf16",
3346
  "nbytes": 147456,
3347
  "byteOffset": 18439168
@@ -3351,7 +3351,7 @@
3351
  "shape": [
3352
  1536
3353
  ],
3354
- "dtype": "float16",
3355
  "format": "f32-to-bf16",
3356
  "nbytes": 3072,
3357
  "byteOffset": 18586624
@@ -3373,13 +3373,13 @@
3373
  1536,
3374
  280
3375
  ],
3376
- "dtype": "float16",
3377
  "format": "f32-to-bf16",
3378
  "nbytes": 860160,
3379
  "byteOffset": 25470976
3380
  }
3381
  ],
3382
- "md5sum": "fb5d17d4e512b052b49fd8ab7c852b5b"
3383
  },
3384
  {
3385
  "dataPath": "params_shard_29.bin",
@@ -3403,7 +3403,7 @@
3403
  17920,
3404
  48
3405
  ],
3406
- "dtype": "float16",
3407
  "format": "f32-to-bf16",
3408
  "nbytes": 1720320,
3409
  "byteOffset": 13762560
@@ -3413,7 +3413,7 @@
3413
  "shape": [
3414
  1536
3415
  ],
3416
- "dtype": "float16",
3417
  "format": "f32-to-bf16",
3418
  "nbytes": 3072,
3419
  "byteOffset": 15482880
@@ -3423,7 +3423,7 @@
3423
  "shape": [
3424
  2048
3425
  ],
3426
- "dtype": "float16",
3427
  "format": "f32-to-bf16",
3428
  "nbytes": 4096,
3429
  "byteOffset": 15485952
@@ -3445,7 +3445,7 @@
3445
  2048,
3446
  48
3447
  ],
3448
- "dtype": "float16",
3449
  "format": "f32-to-bf16",
3450
  "nbytes": 196608,
3451
  "byteOffset": 17062912
@@ -3467,7 +3467,7 @@
3467
  1536,
3468
  48
3469
  ],
3470
- "dtype": "float16",
3471
  "format": "f32-to-bf16",
3472
  "nbytes": 147456,
3473
  "byteOffset": 18439168
@@ -3477,7 +3477,7 @@
3477
  "shape": [
3478
  1536
3479
  ],
3480
- "dtype": "float16",
3481
  "format": "f32-to-bf16",
3482
  "nbytes": 3072,
3483
  "byteOffset": 18586624
@@ -3499,13 +3499,13 @@
3499
  1536,
3500
  280
3501
  ],
3502
- "dtype": "float16",
3503
  "format": "f32-to-bf16",
3504
  "nbytes": 860160,
3505
  "byteOffset": 25470976
3506
  }
3507
  ],
3508
- "md5sum": "8d4e6597b7773c2d20af82e5d4a11844"
3509
  },
3510
  {
3511
  "dataPath": "params_shard_30.bin",
@@ -3529,7 +3529,7 @@
3529
  17920,
3530
  48
3531
  ],
3532
- "dtype": "float16",
3533
  "format": "f32-to-bf16",
3534
  "nbytes": 1720320,
3535
  "byteOffset": 13762560
@@ -3539,7 +3539,7 @@
3539
  "shape": [
3540
  1536
3541
  ],
3542
- "dtype": "float16",
3543
  "format": "f32-to-bf16",
3544
  "nbytes": 3072,
3545
  "byteOffset": 15482880
@@ -3549,7 +3549,7 @@
3549
  "shape": [
3550
  2048
3551
  ],
3552
- "dtype": "float16",
3553
  "format": "f32-to-bf16",
3554
  "nbytes": 4096,
3555
  "byteOffset": 15485952
@@ -3571,7 +3571,7 @@
3571
  2048,
3572
  48
3573
  ],
3574
- "dtype": "float16",
3575
  "format": "f32-to-bf16",
3576
  "nbytes": 196608,
3577
  "byteOffset": 17062912
@@ -3593,7 +3593,7 @@
3593
  1536,
3594
  48
3595
  ],
3596
- "dtype": "float16",
3597
  "format": "f32-to-bf16",
3598
  "nbytes": 147456,
3599
  "byteOffset": 18439168
@@ -3603,13 +3603,13 @@
3603
  "shape": [
3604
  1536
3605
  ],
3606
- "dtype": "float16",
3607
  "format": "f32-to-bf16",
3608
  "nbytes": 3072,
3609
  "byteOffset": 18586624
3610
  }
3611
  ],
3612
- "md5sum": "f2f4c5c3d83aaa1d953bcc146de45dcf"
3613
  }
3614
  ]
3615
  }
 
1
  {
2
  "metadata": {
3
  "ParamSize": 313,
4
+ "ParamBytes": 1111169024.0,
5
+ "BitsPerParam": 5.002201462167321
6
  },
7
  "records": [
8
  {
 
22
  "byteOffset": 0
23
  }
24
  ],
25
+ "md5sum": "3eba7944239eea590b63e87f00016a6b"
26
  },
27
  {
28
  "dataPath": "params_shard_1.bin",
 
41
  "byteOffset": 0
42
  }
43
  ],
44
+ "md5sum": "be8d442fc5234135620521550a8148fa"
45
  },
46
  {
47
  "dataPath": "params_shard_2.bin",
 
54
  151936,
55
  48
56
  ],
57
+ "dtype": "float32",
58
  "format": "f32-to-bf16",
59
  "nbytes": 14585856,
60
  "byteOffset": 0
 
65
  151936,
66
  48
67
  ],
68
+ "dtype": "float32",
69
  "format": "f32-to-bf16",
70
  "nbytes": 14585856,
71
  "byteOffset": 14585856
 
75
  "shape": [
76
  1536
77
  ],
78
+ "dtype": "float32",
79
  "format": "f32-to-bf16",
80
  "nbytes": 3072,
81
  "byteOffset": 29171712
82
  }
83
  ],
84
+ "md5sum": "51e65235b4e65bd14f51a603e8ef7b49"
85
  },
86
  {
87
  "dataPath": "params_shard_3.bin",
 
105
  1536,
106
  280
107
  ],
108
+ "dtype": "float32",
109
  "format": "f32-to-bf16",
110
  "nbytes": 860160,
111
  "byteOffset": 6881280
 
127
  17920,
128
  48
129
  ],
130
+ "dtype": "float32",
131
  "format": "f32-to-bf16",
132
  "nbytes": 1720320,
133
  "byteOffset": 21504000
 
137
  "shape": [
138
  1536
139
  ],
140
+ "dtype": "float32",
141
  "format": "f32-to-bf16",
142
  "nbytes": 3072,
143
  "byteOffset": 23224320
 
147
  "shape": [
148
  2048
149
  ],
150
+ "dtype": "float32",
151
  "format": "f32-to-bf16",
152
  "nbytes": 4096,
153
  "byteOffset": 23227392
 
169
  2048,
170
  48
171
  ],
172
+ "dtype": "float32",
173
  "format": "f32-to-bf16",
174
  "nbytes": 196608,
175
  "byteOffset": 24804352
 
191
  1536,
192
  48
193
  ],
194
+ "dtype": "float32",
195
  "format": "f32-to-bf16",
196
  "nbytes": 147456,
197
  "byteOffset": 26180608
 
201
  "shape": [
202
  1536
203
  ],
204
+ "dtype": "float32",
205
  "format": "f32-to-bf16",
206
  "nbytes": 3072,
207
  "byteOffset": 26328064
 
218
  "byteOffset": 26331136
219
  }
220
  ],
221
+ "md5sum": "59cea6a143c3e50522e6a7ab56fd1302"
222
  },
223
  {
224
  "dataPath": "params_shard_4.bin",
 
231
  1536,
232
  280
233
  ],
234
+ "dtype": "float32",
235
  "format": "f32-to-bf16",
236
  "nbytes": 860160,
237
  "byteOffset": 0
 
253
  17920,
254
  48
255
  ],
256
+ "dtype": "float32",
257
  "format": "f32-to-bf16",
258
  "nbytes": 1720320,
259
  "byteOffset": 14622720
 
263
  "shape": [
264
  1536
265
  ],
266
+ "dtype": "float32",
267
  "format": "f32-to-bf16",
268
  "nbytes": 3072,
269
  "byteOffset": 16343040
 
273
  "shape": [
274
  2048
275
  ],
276
+ "dtype": "float32",
277
  "format": "f32-to-bf16",
278
  "nbytes": 4096,
279
  "byteOffset": 16346112
 
295
  2048,
296
  48
297
  ],
298
+ "dtype": "float32",
299
  "format": "f32-to-bf16",
300
  "nbytes": 196608,
301
  "byteOffset": 17923072
 
317
  1536,
318
  48
319
  ],
320
+ "dtype": "float32",
321
  "format": "f32-to-bf16",
322
  "nbytes": 147456,
323
  "byteOffset": 19299328
 
327
  "shape": [
328
  1536
329
  ],
330
+ "dtype": "float32",
331
  "format": "f32-to-bf16",
332
  "nbytes": 3072,
333
  "byteOffset": 19446784
 
349
  1536,
350
  280
351
  ],
352
+ "dtype": "float32",
353
  "format": "f32-to-bf16",
354
  "nbytes": 860160,
355
  "byteOffset": 26331136
356
  }
357
  ],
358
+ "md5sum": "13283f546f5e1640e0d179f91c737060"
359
  },
360
  {
361
  "dataPath": "params_shard_5.bin",
 
379
  17920,
380
  48
381
  ],
382
+ "dtype": "float32",
383
  "format": "f32-to-bf16",
384
  "nbytes": 1720320,
385
  "byteOffset": 13762560
 
389
  "shape": [
390
  1536
391
  ],
392
+ "dtype": "float32",
393
  "format": "f32-to-bf16",
394
  "nbytes": 3072,
395
  "byteOffset": 15482880
 
399
  "shape": [
400
  2048
401
  ],
402
+ "dtype": "float32",
403
  "format": "f32-to-bf16",
404
  "nbytes": 4096,
405
  "byteOffset": 15485952
 
421
  2048,
422
  48
423
  ],
424
+ "dtype": "float32",
425
  "format": "f32-to-bf16",
426
  "nbytes": 196608,
427
  "byteOffset": 17062912
 
443
  1536,
444
  48
445
  ],
446
+ "dtype": "float32",
447
  "format": "f32-to-bf16",
448
  "nbytes": 147456,
449
  "byteOffset": 18439168
 
453
  "shape": [
454
  1536
455
  ],
456
+ "dtype": "float32",
457
  "format": "f32-to-bf16",
458
  "nbytes": 3072,
459
  "byteOffset": 18586624
 
475
  1536,
476
  280
477
  ],
478
+ "dtype": "float32",
479
  "format": "f32-to-bf16",
480
  "nbytes": 860160,
481
  "byteOffset": 25470976
482
  }
483
  ],
484
+ "md5sum": "f80a070c11451222f8169d453336a19c"
485
  },
486
  {
487
  "dataPath": "params_shard_6.bin",
 
505
  17920,
506
  48
507
  ],
508
+ "dtype": "float32",
509
  "format": "f32-to-bf16",
510
  "nbytes": 1720320,
511
  "byteOffset": 13762560
 
515
  "shape": [
516
  1536
517
  ],
518
+ "dtype": "float32",
519
  "format": "f32-to-bf16",
520
  "nbytes": 3072,
521
  "byteOffset": 15482880
 
525
  "shape": [
526
  2048
527
  ],
528
+ "dtype": "float32",
529
  "format": "f32-to-bf16",
530
  "nbytes": 4096,
531
  "byteOffset": 15485952
 
547
  2048,
548
  48
549
  ],
550
+ "dtype": "float32",
551
  "format": "f32-to-bf16",
552
  "nbytes": 196608,
553
  "byteOffset": 17062912
 
569
  1536,
570
  48
571
  ],
572
+ "dtype": "float32",
573
  "format": "f32-to-bf16",
574
  "nbytes": 147456,
575
  "byteOffset": 18439168
 
579
  "shape": [
580
  1536
581
  ],
582
+ "dtype": "float32",
583
  "format": "f32-to-bf16",
584
  "nbytes": 3072,
585
  "byteOffset": 18586624
 
601
  1536,
602
  280
603
  ],
604
+ "dtype": "float32",
605
  "format": "f32-to-bf16",
606
  "nbytes": 860160,
607
  "byteOffset": 25470976
608
  }
609
  ],
610
+ "md5sum": "114d2917404e99a37c39aacfa57a9a50"
611
  },
612
  {
613
  "dataPath": "params_shard_7.bin",
 
631
  17920,
632
  48
633
  ],
634
+ "dtype": "float32",
635
  "format": "f32-to-bf16",
636
  "nbytes": 1720320,
637
  "byteOffset": 13762560
 
641
  "shape": [
642
  1536
643
  ],
644
+ "dtype": "float32",
645
  "format": "f32-to-bf16",
646
  "nbytes": 3072,
647
  "byteOffset": 15482880
 
651
  "shape": [
652
  2048
653
  ],
654
+ "dtype": "float32",
655
  "format": "f32-to-bf16",
656
  "nbytes": 4096,
657
  "byteOffset": 15485952
 
673
  2048,
674
  48
675
  ],
676
+ "dtype": "float32",
677
  "format": "f32-to-bf16",
678
  "nbytes": 196608,
679
  "byteOffset": 17062912
 
695
  1536,
696
  48
697
  ],
698
+ "dtype": "float32",
699
  "format": "f32-to-bf16",
700
  "nbytes": 147456,
701
  "byteOffset": 18439168
 
705
  "shape": [
706
  1536
707
  ],
708
+ "dtype": "float32",
709
  "format": "f32-to-bf16",
710
  "nbytes": 3072,
711
  "byteOffset": 18586624
 
727
  1536,
728
  280
729
  ],
730
+ "dtype": "float32",
731
  "format": "f32-to-bf16",
732
  "nbytes": 860160,
733
  "byteOffset": 25470976
734
  }
735
  ],
736
+ "md5sum": "dc3b5e347d2aba0026bc6cc0dcf4b005"
737
  },
738
  {
739
  "dataPath": "params_shard_8.bin",
 
757
  17920,
758
  48
759
  ],
760
+ "dtype": "float32",
761
  "format": "f32-to-bf16",
762
  "nbytes": 1720320,
763
  "byteOffset": 13762560
 
767
  "shape": [
768
  1536
769
  ],
770
+ "dtype": "float32",
771
  "format": "f32-to-bf16",
772
  "nbytes": 3072,
773
  "byteOffset": 15482880
 
777
  "shape": [
778
  2048
779
  ],
780
+ "dtype": "float32",
781
  "format": "f32-to-bf16",
782
  "nbytes": 4096,
783
  "byteOffset": 15485952
 
799
  2048,
800
  48
801
  ],
802
+ "dtype": "float32",
803
  "format": "f32-to-bf16",
804
  "nbytes": 196608,
805
  "byteOffset": 17062912
 
821
  1536,
822
  48
823
  ],
824
+ "dtype": "float32",
825
  "format": "f32-to-bf16",
826
  "nbytes": 147456,
827
  "byteOffset": 18439168
 
831
  "shape": [
832
  1536
833
  ],
834
+ "dtype": "float32",
835
  "format": "f32-to-bf16",
836
  "nbytes": 3072,
837
  "byteOffset": 18586624
 
853
  1536,
854
  280
855
  ],
856
+ "dtype": "float32",
857
  "format": "f32-to-bf16",
858
  "nbytes": 860160,
859
  "byteOffset": 25470976
860
  }
861
  ],
862
+ "md5sum": "60e7284515bb4c2999432289d45839c4"
863
  },
864
  {
865
  "dataPath": "params_shard_9.bin",
 
883
  17920,
884
  48
885
  ],
886
+ "dtype": "float32",
887
  "format": "f32-to-bf16",
888
  "nbytes": 1720320,
889
  "byteOffset": 13762560
 
893
  "shape": [
894
  1536
895
  ],
896
+ "dtype": "float32",
897
  "format": "f32-to-bf16",
898
  "nbytes": 3072,
899
  "byteOffset": 15482880
 
903
  "shape": [
904
  2048
905
  ],
906
+ "dtype": "float32",
907
  "format": "f32-to-bf16",
908
  "nbytes": 4096,
909
  "byteOffset": 15485952
 
925
  2048,
926
  48
927
  ],
928
+ "dtype": "float32",
929
  "format": "f32-to-bf16",
930
  "nbytes": 196608,
931
  "byteOffset": 17062912
 
947
  1536,
948
  48
949
  ],
950
+ "dtype": "float32",
951
  "format": "f32-to-bf16",
952
  "nbytes": 147456,
953
  "byteOffset": 18439168
 
957
  "shape": [
958
  1536
959
  ],
960
+ "dtype": "float32",
961
  "format": "f32-to-bf16",
962
  "nbytes": 3072,
963
  "byteOffset": 18586624
 
979
  1536,
980
  280
981
  ],
982
+ "dtype": "float32",
983
  "format": "f32-to-bf16",
984
  "nbytes": 860160,
985
  "byteOffset": 25470976
986
  }
987
  ],
988
+ "md5sum": "f48e561b8d2b76519c23c5db3e8f6f16"
989
  },
990
  {
991
  "dataPath": "params_shard_10.bin",
 
1009
  17920,
1010
  48
1011
  ],
1012
+ "dtype": "float32",
1013
  "format": "f32-to-bf16",
1014
  "nbytes": 1720320,
1015
  "byteOffset": 13762560
 
1019
  "shape": [
1020
  1536
1021
  ],
1022
+ "dtype": "float32",
1023
  "format": "f32-to-bf16",
1024
  "nbytes": 3072,
1025
  "byteOffset": 15482880
 
1029
  "shape": [
1030
  2048
1031
  ],
1032
+ "dtype": "float32",
1033
  "format": "f32-to-bf16",
1034
  "nbytes": 4096,
1035
  "byteOffset": 15485952
 
1051
  2048,
1052
  48
1053
  ],
1054
+ "dtype": "float32",
1055
  "format": "f32-to-bf16",
1056
  "nbytes": 196608,
1057
  "byteOffset": 17062912
 
1073
  1536,
1074
  48
1075
  ],
1076
+ "dtype": "float32",
1077
  "format": "f32-to-bf16",
1078
  "nbytes": 147456,
1079
  "byteOffset": 18439168
 
1083
  "shape": [
1084
  1536
1085
  ],
1086
+ "dtype": "float32",
1087
  "format": "f32-to-bf16",
1088
  "nbytes": 3072,
1089
  "byteOffset": 18586624
 
1105
  1536,
1106
  280
1107
  ],
1108
+ "dtype": "float32",
1109
  "format": "f32-to-bf16",
1110
  "nbytes": 860160,
1111
  "byteOffset": 25470976
1112
  }
1113
  ],
1114
+ "md5sum": "252c5013974cfddd0dbba30e029f877e"
1115
  },
1116
  {
1117
  "dataPath": "params_shard_11.bin",
 
1135
  17920,
1136
  48
1137
  ],
1138
+ "dtype": "float32",
1139
  "format": "f32-to-bf16",
1140
  "nbytes": 1720320,
1141
  "byteOffset": 13762560
 
1145
  "shape": [
1146
  1536
1147
  ],
1148
+ "dtype": "float32",
1149
  "format": "f32-to-bf16",
1150
  "nbytes": 3072,
1151
  "byteOffset": 15482880
 
1155
  "shape": [
1156
  2048
1157
  ],
1158
+ "dtype": "float32",
1159
  "format": "f32-to-bf16",
1160
  "nbytes": 4096,
1161
  "byteOffset": 15485952
 
1177
  2048,
1178
  48
1179
  ],
1180
+ "dtype": "float32",
1181
  "format": "f32-to-bf16",
1182
  "nbytes": 196608,
1183
  "byteOffset": 17062912
 
1199
  1536,
1200
  48
1201
  ],
1202
+ "dtype": "float32",
1203
  "format": "f32-to-bf16",
1204
  "nbytes": 147456,
1205
  "byteOffset": 18439168
 
1209
  "shape": [
1210
  1536
1211
  ],
1212
+ "dtype": "float32",
1213
  "format": "f32-to-bf16",
1214
  "nbytes": 3072,
1215
  "byteOffset": 18586624
 
1231
  1536,
1232
  280
1233
  ],
1234
+ "dtype": "float32",
1235
  "format": "f32-to-bf16",
1236
  "nbytes": 860160,
1237
  "byteOffset": 25470976
1238
  }
1239
  ],
1240
+ "md5sum": "390cb82a590d93b12129b8d3c50f73f1"
1241
  },
1242
  {
1243
  "dataPath": "params_shard_12.bin",
 
1261
  17920,
1262
  48
1263
  ],
1264
+ "dtype": "float32",
1265
  "format": "f32-to-bf16",
1266
  "nbytes": 1720320,
1267
  "byteOffset": 13762560
 
1271
  "shape": [
1272
  1536
1273
  ],
1274
+ "dtype": "float32",
1275
  "format": "f32-to-bf16",
1276
  "nbytes": 3072,
1277
  "byteOffset": 15482880
 
1281
  "shape": [
1282
  2048
1283
  ],
1284
+ "dtype": "float32",
1285
  "format": "f32-to-bf16",
1286
  "nbytes": 4096,
1287
  "byteOffset": 15485952
 
1303
  2048,
1304
  48
1305
  ],
1306
+ "dtype": "float32",
1307
  "format": "f32-to-bf16",
1308
  "nbytes": 196608,
1309
  "byteOffset": 17062912
 
1325
  1536,
1326
  48
1327
  ],
1328
+ "dtype": "float32",
1329
  "format": "f32-to-bf16",
1330
  "nbytes": 147456,
1331
  "byteOffset": 18439168
 
1335
  "shape": [
1336
  1536
1337
  ],
1338
+ "dtype": "float32",
1339
  "format": "f32-to-bf16",
1340
  "nbytes": 3072,
1341
  "byteOffset": 18586624
 
1357
  1536,
1358
  280
1359
  ],
1360
+ "dtype": "float32",
1361
  "format": "f32-to-bf16",
1362
  "nbytes": 860160,
1363
  "byteOffset": 25470976
1364
  }
1365
  ],
1366
+ "md5sum": "a3495d635ea3c53c9b0bbbcef749ceb8"
1367
  },
1368
  {
1369
  "dataPath": "params_shard_13.bin",
 
1387
  17920,
1388
  48
1389
  ],
1390
+ "dtype": "float32",
1391
  "format": "f32-to-bf16",
1392
  "nbytes": 1720320,
1393
  "byteOffset": 13762560
 
1397
  "shape": [
1398
  1536
1399
  ],
1400
+ "dtype": "float32",
1401
  "format": "f32-to-bf16",
1402
  "nbytes": 3072,
1403
  "byteOffset": 15482880
 
1407
  "shape": [
1408
  2048
1409
  ],
1410
+ "dtype": "float32",
1411
  "format": "f32-to-bf16",
1412
  "nbytes": 4096,
1413
  "byteOffset": 15485952
 
1429
  2048,
1430
  48
1431
  ],
1432
+ "dtype": "float32",
1433
  "format": "f32-to-bf16",
1434
  "nbytes": 196608,
1435
  "byteOffset": 17062912
 
1451
  1536,
1452
  48
1453
  ],
1454
+ "dtype": "float32",
1455
  "format": "f32-to-bf16",
1456
  "nbytes": 147456,
1457
  "byteOffset": 18439168
 
1461
  "shape": [
1462
  1536
1463
  ],
1464
+ "dtype": "float32",
1465
  "format": "f32-to-bf16",
1466
  "nbytes": 3072,
1467
  "byteOffset": 18586624
 
1483
  1536,
1484
  280
1485
  ],
1486
+ "dtype": "float32",
1487
  "format": "f32-to-bf16",
1488
  "nbytes": 860160,
1489
  "byteOffset": 25470976
1490
  }
1491
  ],
1492
+ "md5sum": "35700f4804c01da98c6241cee2ff5732"
1493
  },
1494
  {
1495
  "dataPath": "params_shard_14.bin",
 
1513
  17920,
1514
  48
1515
  ],
1516
+ "dtype": "float32",
1517
  "format": "f32-to-bf16",
1518
  "nbytes": 1720320,
1519
  "byteOffset": 13762560
 
1523
  "shape": [
1524
  1536
1525
  ],
1526
+ "dtype": "float32",
1527
  "format": "f32-to-bf16",
1528
  "nbytes": 3072,
1529
  "byteOffset": 15482880
 
1533
  "shape": [
1534
  2048
1535
  ],
1536
+ "dtype": "float32",
1537
  "format": "f32-to-bf16",
1538
  "nbytes": 4096,
1539
  "byteOffset": 15485952
 
1555
  2048,
1556
  48
1557
  ],
1558
+ "dtype": "float32",
1559
  "format": "f32-to-bf16",
1560
  "nbytes": 196608,
1561
  "byteOffset": 17062912
 
1577
  1536,
1578
  48
1579
  ],
1580
+ "dtype": "float32",
1581
  "format": "f32-to-bf16",
1582
  "nbytes": 147456,
1583
  "byteOffset": 18439168
 
1587
  "shape": [
1588
  1536
1589
  ],
1590
+ "dtype": "float32",
1591
  "format": "f32-to-bf16",
1592
  "nbytes": 3072,
1593
  "byteOffset": 18586624
 
1609
  1536,
1610
  280
1611
  ],
1612
+ "dtype": "float32",
1613
  "format": "f32-to-bf16",
1614
  "nbytes": 860160,
1615
  "byteOffset": 25470976
1616
  }
1617
  ],
1618
+ "md5sum": "fc44a49e8c67d1e47c7d9f9b47c32cb5"
1619
  },
1620
  {
1621
  "dataPath": "params_shard_15.bin",
 
1639
  17920,
1640
  48
1641
  ],
1642
+ "dtype": "float32",
1643
  "format": "f32-to-bf16",
1644
  "nbytes": 1720320,
1645
  "byteOffset": 13762560
 
1649
  "shape": [
1650
  1536
1651
  ],
1652
+ "dtype": "float32",
1653
  "format": "f32-to-bf16",
1654
  "nbytes": 3072,
1655
  "byteOffset": 15482880
 
1659
  "shape": [
1660
  2048
1661
  ],
1662
+ "dtype": "float32",
1663
  "format": "f32-to-bf16",
1664
  "nbytes": 4096,
1665
  "byteOffset": 15485952
 
1681
  2048,
1682
  48
1683
  ],
1684
+ "dtype": "float32",
1685
  "format": "f32-to-bf16",
1686
  "nbytes": 196608,
1687
  "byteOffset": 17062912
 
1703
  1536,
1704
  48
1705
  ],
1706
+ "dtype": "float32",
1707
  "format": "f32-to-bf16",
1708
  "nbytes": 147456,
1709
  "byteOffset": 18439168
 
1713
  "shape": [
1714
  1536
1715
  ],
1716
+ "dtype": "float32",
1717
  "format": "f32-to-bf16",
1718
  "nbytes": 3072,
1719
  "byteOffset": 18586624
 
1735
  1536,
1736
  280
1737
  ],
1738
+ "dtype": "float32",
1739
  "format": "f32-to-bf16",
1740
  "nbytes": 860160,
1741
  "byteOffset": 25470976
1742
  }
1743
  ],
1744
+ "md5sum": "66952571c7809812a74701771112d5ac"
1745
  },
1746
  {
1747
  "dataPath": "params_shard_16.bin",
 
1765
  17920,
1766
  48
1767
  ],
1768
+ "dtype": "float32",
1769
  "format": "f32-to-bf16",
1770
  "nbytes": 1720320,
1771
  "byteOffset": 13762560
 
1775
  "shape": [
1776
  1536
1777
  ],
1778
+ "dtype": "float32",
1779
  "format": "f32-to-bf16",
1780
  "nbytes": 3072,
1781
  "byteOffset": 15482880
 
1785
  "shape": [
1786
  2048
1787
  ],
1788
+ "dtype": "float32",
1789
  "format": "f32-to-bf16",
1790
  "nbytes": 4096,
1791
  "byteOffset": 15485952
 
1807
  2048,
1808
  48
1809
  ],
1810
+ "dtype": "float32",
1811
  "format": "f32-to-bf16",
1812
  "nbytes": 196608,
1813
  "byteOffset": 17062912
 
1829
  1536,
1830
  48
1831
  ],
1832
+ "dtype": "float32",
1833
  "format": "f32-to-bf16",
1834
  "nbytes": 147456,
1835
  "byteOffset": 18439168
 
1839
  "shape": [
1840
  1536
1841
  ],
1842
+ "dtype": "float32",
1843
  "format": "f32-to-bf16",
1844
  "nbytes": 3072,
1845
  "byteOffset": 18586624
 
1861
  1536,
1862
  280
1863
  ],
1864
+ "dtype": "float32",
1865
  "format": "f32-to-bf16",
1866
  "nbytes": 860160,
1867
  "byteOffset": 25470976
1868
  }
1869
  ],
1870
+ "md5sum": "451ddd6918f481774a5ddcae93fcc19a"
1871
  },
1872
  {
1873
  "dataPath": "params_shard_17.bin",
 
1891
  17920,
1892
  48
1893
  ],
1894
+ "dtype": "float32",
1895
  "format": "f32-to-bf16",
1896
  "nbytes": 1720320,
1897
  "byteOffset": 13762560
 
1901
  "shape": [
1902
  1536
1903
  ],
1904
+ "dtype": "float32",
1905
  "format": "f32-to-bf16",
1906
  "nbytes": 3072,
1907
  "byteOffset": 15482880
 
1911
  "shape": [
1912
  2048
1913
  ],
1914
+ "dtype": "float32",
1915
  "format": "f32-to-bf16",
1916
  "nbytes": 4096,
1917
  "byteOffset": 15485952
 
1933
  2048,
1934
  48
1935
  ],
1936
+ "dtype": "float32",
1937
  "format": "f32-to-bf16",
1938
  "nbytes": 196608,
1939
  "byteOffset": 17062912
 
1955
  1536,
1956
  48
1957
  ],
1958
+ "dtype": "float32",
1959
  "format": "f32-to-bf16",
1960
  "nbytes": 147456,
1961
  "byteOffset": 18439168
 
1965
  "shape": [
1966
  1536
1967
  ],
1968
+ "dtype": "float32",
1969
  "format": "f32-to-bf16",
1970
  "nbytes": 3072,
1971
  "byteOffset": 18586624
 
1987
  1536,
1988
  280
1989
  ],
1990
+ "dtype": "float32",
1991
  "format": "f32-to-bf16",
1992
  "nbytes": 860160,
1993
  "byteOffset": 25470976
1994
  }
1995
  ],
1996
+ "md5sum": "6d6e530a4f2c516481ef459c432eab73"
1997
  },
1998
  {
1999
  "dataPath": "params_shard_18.bin",
 
2017
  17920,
2018
  48
2019
  ],
2020
+ "dtype": "float32",
2021
  "format": "f32-to-bf16",
2022
  "nbytes": 1720320,
2023
  "byteOffset": 13762560
 
2027
  "shape": [
2028
  1536
2029
  ],
2030
+ "dtype": "float32",
2031
  "format": "f32-to-bf16",
2032
  "nbytes": 3072,
2033
  "byteOffset": 15482880
 
2037
  "shape": [
2038
  2048
2039
  ],
2040
+ "dtype": "float32",
2041
  "format": "f32-to-bf16",
2042
  "nbytes": 4096,
2043
  "byteOffset": 15485952
 
2059
  2048,
2060
  48
2061
  ],
2062
+ "dtype": "float32",
2063
  "format": "f32-to-bf16",
2064
  "nbytes": 196608,
2065
  "byteOffset": 17062912
 
2081
  1536,
2082
  48
2083
  ],
2084
+ "dtype": "float32",
2085
  "format": "f32-to-bf16",
2086
  "nbytes": 147456,
2087
  "byteOffset": 18439168
 
2091
  "shape": [
2092
  1536
2093
  ],
2094
+ "dtype": "float32",
2095
  "format": "f32-to-bf16",
2096
  "nbytes": 3072,
2097
  "byteOffset": 18586624
 
2113
  1536,
2114
  280
2115
  ],
2116
+ "dtype": "float32",
2117
  "format": "f32-to-bf16",
2118
  "nbytes": 860160,
2119
  "byteOffset": 25470976
2120
  }
2121
  ],
2122
+ "md5sum": "0e25e76a52534e27e009f1966b60e908"
2123
  },
2124
  {
2125
  "dataPath": "params_shard_19.bin",
 
2143
  17920,
2144
  48
2145
  ],
2146
+ "dtype": "float32",
2147
  "format": "f32-to-bf16",
2148
  "nbytes": 1720320,
2149
  "byteOffset": 13762560
 
2153
  "shape": [
2154
  1536
2155
  ],
2156
+ "dtype": "float32",
2157
  "format": "f32-to-bf16",
2158
  "nbytes": 3072,
2159
  "byteOffset": 15482880
 
2163
  "shape": [
2164
  2048
2165
  ],
2166
+ "dtype": "float32",
2167
  "format": "f32-to-bf16",
2168
  "nbytes": 4096,
2169
  "byteOffset": 15485952
 
2185
  2048,
2186
  48
2187
  ],
2188
+ "dtype": "float32",
2189
  "format": "f32-to-bf16",
2190
  "nbytes": 196608,
2191
  "byteOffset": 17062912
 
2207
  1536,
2208
  48
2209
  ],
2210
+ "dtype": "float32",
2211
  "format": "f32-to-bf16",
2212
  "nbytes": 147456,
2213
  "byteOffset": 18439168
 
2217
  "shape": [
2218
  1536
2219
  ],
2220
+ "dtype": "float32",
2221
  "format": "f32-to-bf16",
2222
  "nbytes": 3072,
2223
  "byteOffset": 18586624
 
2239
  1536,
2240
  280
2241
  ],
2242
+ "dtype": "float32",
2243
  "format": "f32-to-bf16",
2244
  "nbytes": 860160,
2245
  "byteOffset": 25470976
2246
  }
2247
  ],
2248
+ "md5sum": "0b2f3521eb647a178bf4fe69ebbefca4"
2249
  },
2250
  {
2251
  "dataPath": "params_shard_20.bin",
 
2269
  17920,
2270
  48
2271
  ],
2272
+ "dtype": "float32",
2273
  "format": "f32-to-bf16",
2274
  "nbytes": 1720320,
2275
  "byteOffset": 13762560
 
2279
  "shape": [
2280
  1536
2281
  ],
2282
+ "dtype": "float32",
2283
  "format": "f32-to-bf16",
2284
  "nbytes": 3072,
2285
  "byteOffset": 15482880
 
2289
  "shape": [
2290
  2048
2291
  ],
2292
+ "dtype": "float32",
2293
  "format": "f32-to-bf16",
2294
  "nbytes": 4096,
2295
  "byteOffset": 15485952
 
2311
  2048,
2312
  48
2313
  ],
2314
+ "dtype": "float32",
2315
  "format": "f32-to-bf16",
2316
  "nbytes": 196608,
2317
  "byteOffset": 17062912
 
2333
  1536,
2334
  48
2335
  ],
2336
+ "dtype": "float32",
2337
  "format": "f32-to-bf16",
2338
  "nbytes": 147456,
2339
  "byteOffset": 18439168
 
2343
  "shape": [
2344
  1536
2345
  ],
2346
+ "dtype": "float32",
2347
  "format": "f32-to-bf16",
2348
  "nbytes": 3072,
2349
  "byteOffset": 18586624
 
2365
  1536,
2366
  280
2367
  ],
2368
+ "dtype": "float32",
2369
  "format": "f32-to-bf16",
2370
  "nbytes": 860160,
2371
  "byteOffset": 25470976
2372
  }
2373
  ],
2374
+ "md5sum": "176c5666e37994d7f23960de639e90cc"
2375
  },
2376
  {
2377
  "dataPath": "params_shard_21.bin",
 
2395
  17920,
2396
  48
2397
  ],
2398
+ "dtype": "float32",
2399
  "format": "f32-to-bf16",
2400
  "nbytes": 1720320,
2401
  "byteOffset": 13762560
 
2405
  "shape": [
2406
  1536
2407
  ],
2408
+ "dtype": "float32",
2409
  "format": "f32-to-bf16",
2410
  "nbytes": 3072,
2411
  "byteOffset": 15482880
 
2415
  "shape": [
2416
  2048
2417
  ],
2418
+ "dtype": "float32",
2419
  "format": "f32-to-bf16",
2420
  "nbytes": 4096,
2421
  "byteOffset": 15485952
 
2437
  2048,
2438
  48
2439
  ],
2440
+ "dtype": "float32",
2441
  "format": "f32-to-bf16",
2442
  "nbytes": 196608,
2443
  "byteOffset": 17062912
 
2459
  1536,
2460
  48
2461
  ],
2462
+ "dtype": "float32",
2463
  "format": "f32-to-bf16",
2464
  "nbytes": 147456,
2465
  "byteOffset": 18439168
 
2469
  "shape": [
2470
  1536
2471
  ],
2472
+ "dtype": "float32",
2473
  "format": "f32-to-bf16",
2474
  "nbytes": 3072,
2475
  "byteOffset": 18586624
 
2491
  1536,
2492
  280
2493
  ],
2494
+ "dtype": "float32",
2495
  "format": "f32-to-bf16",
2496
  "nbytes": 860160,
2497
  "byteOffset": 25470976
2498
  }
2499
  ],
2500
+ "md5sum": "ceb962974aa3ffd06a616a6c52270097"
2501
  },
2502
  {
2503
  "dataPath": "params_shard_22.bin",
 
2521
  17920,
2522
  48
2523
  ],
2524
+ "dtype": "float32",
2525
  "format": "f32-to-bf16",
2526
  "nbytes": 1720320,
2527
  "byteOffset": 13762560
 
2531
  "shape": [
2532
  1536
2533
  ],
2534
+ "dtype": "float32",
2535
  "format": "f32-to-bf16",
2536
  "nbytes": 3072,
2537
  "byteOffset": 15482880
 
2541
  "shape": [
2542
  2048
2543
  ],
2544
+ "dtype": "float32",
2545
  "format": "f32-to-bf16",
2546
  "nbytes": 4096,
2547
  "byteOffset": 15485952
 
2563
  2048,
2564
  48
2565
  ],
2566
+ "dtype": "float32",
2567
  "format": "f32-to-bf16",
2568
  "nbytes": 196608,
2569
  "byteOffset": 17062912
 
2585
  1536,
2586
  48
2587
  ],
2588
+ "dtype": "float32",
2589
  "format": "f32-to-bf16",
2590
  "nbytes": 147456,
2591
  "byteOffset": 18439168
 
2595
  "shape": [
2596
  1536
2597
  ],
2598
+ "dtype": "float32",
2599
  "format": "f32-to-bf16",
2600
  "nbytes": 3072,
2601
  "byteOffset": 18586624
 
2617
  1536,
2618
  280
2619
  ],
2620
+ "dtype": "float32",
2621
  "format": "f32-to-bf16",
2622
  "nbytes": 860160,
2623
  "byteOffset": 25470976
2624
  }
2625
  ],
2626
+ "md5sum": "ab9d7f443673b7890cfbf49008594ab9"
2627
  },
2628
  {
2629
  "dataPath": "params_shard_23.bin",
 
2647
  17920,
2648
  48
2649
  ],
2650
+ "dtype": "float32",
2651
  "format": "f32-to-bf16",
2652
  "nbytes": 1720320,
2653
  "byteOffset": 13762560
 
2657
  "shape": [
2658
  1536
2659
  ],
2660
+ "dtype": "float32",
2661
  "format": "f32-to-bf16",
2662
  "nbytes": 3072,
2663
  "byteOffset": 15482880
 
2667
  "shape": [
2668
  2048
2669
  ],
2670
+ "dtype": "float32",
2671
  "format": "f32-to-bf16",
2672
  "nbytes": 4096,
2673
  "byteOffset": 15485952
 
2689
  2048,
2690
  48
2691
  ],
2692
+ "dtype": "float32",
2693
  "format": "f32-to-bf16",
2694
  "nbytes": 196608,
2695
  "byteOffset": 17062912
 
2711
  1536,
2712
  48
2713
  ],
2714
+ "dtype": "float32",
2715
  "format": "f32-to-bf16",
2716
  "nbytes": 147456,
2717
  "byteOffset": 18439168
 
2721
  "shape": [
2722
  1536
2723
  ],
2724
+ "dtype": "float32",
2725
  "format": "f32-to-bf16",
2726
  "nbytes": 3072,
2727
  "byteOffset": 18586624
 
2743
  1536,
2744
  280
2745
  ],
2746
+ "dtype": "float32",
2747
  "format": "f32-to-bf16",
2748
  "nbytes": 860160,
2749
  "byteOffset": 25470976
2750
  }
2751
  ],
2752
+ "md5sum": "61f19df02bf82992f18b0a6ec1370776"
2753
  },
2754
  {
2755
  "dataPath": "params_shard_24.bin",
 
2773
  17920,
2774
  48
2775
  ],
2776
+ "dtype": "float32",
2777
  "format": "f32-to-bf16",
2778
  "nbytes": 1720320,
2779
  "byteOffset": 13762560
 
2783
  "shape": [
2784
  1536
2785
  ],
2786
+ "dtype": "float32",
2787
  "format": "f32-to-bf16",
2788
  "nbytes": 3072,
2789
  "byteOffset": 15482880
 
2793
  "shape": [
2794
  2048
2795
  ],
2796
+ "dtype": "float32",
2797
  "format": "f32-to-bf16",
2798
  "nbytes": 4096,
2799
  "byteOffset": 15485952
 
2815
  2048,
2816
  48
2817
  ],
2818
+ "dtype": "float32",
2819
  "format": "f32-to-bf16",
2820
  "nbytes": 196608,
2821
  "byteOffset": 17062912
 
2837
  1536,
2838
  48
2839
  ],
2840
+ "dtype": "float32",
2841
  "format": "f32-to-bf16",
2842
  "nbytes": 147456,
2843
  "byteOffset": 18439168
 
2847
  "shape": [
2848
  1536
2849
  ],
2850
+ "dtype": "float32",
2851
  "format": "f32-to-bf16",
2852
  "nbytes": 3072,
2853
  "byteOffset": 18586624
 
2869
  1536,
2870
  280
2871
  ],
2872
+ "dtype": "float32",
2873
  "format": "f32-to-bf16",
2874
  "nbytes": 860160,
2875
  "byteOffset": 25470976
2876
  }
2877
  ],
2878
+ "md5sum": "9bd46c03febaca7936dd5c670e87c9db"
2879
  },
2880
  {
2881
  "dataPath": "params_shard_25.bin",
 
2899
  17920,
2900
  48
2901
  ],
2902
+ "dtype": "float32",
2903
  "format": "f32-to-bf16",
2904
  "nbytes": 1720320,
2905
  "byteOffset": 13762560
 
2909
  "shape": [
2910
  1536
2911
  ],
2912
+ "dtype": "float32",
2913
  "format": "f32-to-bf16",
2914
  "nbytes": 3072,
2915
  "byteOffset": 15482880
 
2919
  "shape": [
2920
  2048
2921
  ],
2922
+ "dtype": "float32",
2923
  "format": "f32-to-bf16",
2924
  "nbytes": 4096,
2925
  "byteOffset": 15485952
 
2941
  2048,
2942
  48
2943
  ],
2944
+ "dtype": "float32",
2945
  "format": "f32-to-bf16",
2946
  "nbytes": 196608,
2947
  "byteOffset": 17062912
 
2963
  1536,
2964
  48
2965
  ],
2966
+ "dtype": "float32",
2967
  "format": "f32-to-bf16",
2968
  "nbytes": 147456,
2969
  "byteOffset": 18439168
 
2973
  "shape": [
2974
  1536
2975
  ],
2976
+ "dtype": "float32",
2977
  "format": "f32-to-bf16",
2978
  "nbytes": 3072,
2979
  "byteOffset": 18586624
 
2995
  1536,
2996
  280
2997
  ],
2998
+ "dtype": "float32",
2999
  "format": "f32-to-bf16",
3000
  "nbytes": 860160,
3001
  "byteOffset": 25470976
3002
  }
3003
  ],
3004
+ "md5sum": "a967b6249d494149ba4d36888fb580be"
3005
  },
3006
  {
3007
  "dataPath": "params_shard_26.bin",
 
3025
  17920,
3026
  48
3027
  ],
3028
+ "dtype": "float32",
3029
  "format": "f32-to-bf16",
3030
  "nbytes": 1720320,
3031
  "byteOffset": 13762560
 
3035
  "shape": [
3036
  1536
3037
  ],
3038
+ "dtype": "float32",
3039
  "format": "f32-to-bf16",
3040
  "nbytes": 3072,
3041
  "byteOffset": 15482880
 
3045
  "shape": [
3046
  2048
3047
  ],
3048
+ "dtype": "float32",
3049
  "format": "f32-to-bf16",
3050
  "nbytes": 4096,
3051
  "byteOffset": 15485952
 
3067
  2048,
3068
  48
3069
  ],
3070
+ "dtype": "float32",
3071
  "format": "f32-to-bf16",
3072
  "nbytes": 196608,
3073
  "byteOffset": 17062912
 
3089
  1536,
3090
  48
3091
  ],
3092
+ "dtype": "float32",
3093
  "format": "f32-to-bf16",
3094
  "nbytes": 147456,
3095
  "byteOffset": 18439168
 
3099
  "shape": [
3100
  1536
3101
  ],
3102
+ "dtype": "float32",
3103
  "format": "f32-to-bf16",
3104
  "nbytes": 3072,
3105
  "byteOffset": 18586624
 
3121
  1536,
3122
  280
3123
  ],
3124
+ "dtype": "float32",
3125
  "format": "f32-to-bf16",
3126
  "nbytes": 860160,
3127
  "byteOffset": 25470976
3128
  }
3129
  ],
3130
+ "md5sum": "c456c605796669a1a035b5509af8b906"
3131
  },
3132
  {
3133
  "dataPath": "params_shard_27.bin",
 
3151
  17920,
3152
  48
3153
  ],
3154
+ "dtype": "float32",
3155
  "format": "f32-to-bf16",
3156
  "nbytes": 1720320,
3157
  "byteOffset": 13762560
 
3161
  "shape": [
3162
  1536
3163
  ],
3164
+ "dtype": "float32",
3165
  "format": "f32-to-bf16",
3166
  "nbytes": 3072,
3167
  "byteOffset": 15482880
 
3171
  "shape": [
3172
  2048
3173
  ],
3174
+ "dtype": "float32",
3175
  "format": "f32-to-bf16",
3176
  "nbytes": 4096,
3177
  "byteOffset": 15485952
 
3193
  2048,
3194
  48
3195
  ],
3196
+ "dtype": "float32",
3197
  "format": "f32-to-bf16",
3198
  "nbytes": 196608,
3199
  "byteOffset": 17062912
 
3215
  1536,
3216
  48
3217
  ],
3218
+ "dtype": "float32",
3219
  "format": "f32-to-bf16",
3220
  "nbytes": 147456,
3221
  "byteOffset": 18439168
 
3225
  "shape": [
3226
  1536
3227
  ],
3228
+ "dtype": "float32",
3229
  "format": "f32-to-bf16",
3230
  "nbytes": 3072,
3231
  "byteOffset": 18586624
 
3247
  1536,
3248
  280
3249
  ],
3250
+ "dtype": "float32",
3251
  "format": "f32-to-bf16",
3252
  "nbytes": 860160,
3253
  "byteOffset": 25470976
3254
  }
3255
  ],
3256
+ "md5sum": "4932c078feff0216f175050579e08a9a"
3257
  },
3258
  {
3259
  "dataPath": "params_shard_28.bin",
 
3277
  17920,
3278
  48
3279
  ],
3280
+ "dtype": "float32",
3281
  "format": "f32-to-bf16",
3282
  "nbytes": 1720320,
3283
  "byteOffset": 13762560
 
3287
  "shape": [
3288
  1536
3289
  ],
3290
+ "dtype": "float32",
3291
  "format": "f32-to-bf16",
3292
  "nbytes": 3072,
3293
  "byteOffset": 15482880
 
3297
  "shape": [
3298
  2048
3299
  ],
3300
+ "dtype": "float32",
3301
  "format": "f32-to-bf16",
3302
  "nbytes": 4096,
3303
  "byteOffset": 15485952
 
3319
  2048,
3320
  48
3321
  ],
3322
+ "dtype": "float32",
3323
  "format": "f32-to-bf16",
3324
  "nbytes": 196608,
3325
  "byteOffset": 17062912
 
3341
  1536,
3342
  48
3343
  ],
3344
+ "dtype": "float32",
3345
  "format": "f32-to-bf16",
3346
  "nbytes": 147456,
3347
  "byteOffset": 18439168
 
3351
  "shape": [
3352
  1536
3353
  ],
3354
+ "dtype": "float32",
3355
  "format": "f32-to-bf16",
3356
  "nbytes": 3072,
3357
  "byteOffset": 18586624
 
3373
  1536,
3374
  280
3375
  ],
3376
+ "dtype": "float32",
3377
  "format": "f32-to-bf16",
3378
  "nbytes": 860160,
3379
  "byteOffset": 25470976
3380
  }
3381
  ],
3382
+ "md5sum": "8686b64ff10449b640afc32ed7439a65"
3383
  },
3384
  {
3385
  "dataPath": "params_shard_29.bin",
 
3403
  17920,
3404
  48
3405
  ],
3406
+ "dtype": "float32",
3407
  "format": "f32-to-bf16",
3408
  "nbytes": 1720320,
3409
  "byteOffset": 13762560
 
3413
  "shape": [
3414
  1536
3415
  ],
3416
+ "dtype": "float32",
3417
  "format": "f32-to-bf16",
3418
  "nbytes": 3072,
3419
  "byteOffset": 15482880
 
3423
  "shape": [
3424
  2048
3425
  ],
3426
+ "dtype": "float32",
3427
  "format": "f32-to-bf16",
3428
  "nbytes": 4096,
3429
  "byteOffset": 15485952
 
3445
  2048,
3446
  48
3447
  ],
3448
+ "dtype": "float32",
3449
  "format": "f32-to-bf16",
3450
  "nbytes": 196608,
3451
  "byteOffset": 17062912
 
3467
  1536,
3468
  48
3469
  ],
3470
+ "dtype": "float32",
3471
  "format": "f32-to-bf16",
3472
  "nbytes": 147456,
3473
  "byteOffset": 18439168
 
3477
  "shape": [
3478
  1536
3479
  ],
3480
+ "dtype": "float32",
3481
  "format": "f32-to-bf16",
3482
  "nbytes": 3072,
3483
  "byteOffset": 18586624
 
3499
  1536,
3500
  280
3501
  ],
3502
+ "dtype": "float32",
3503
  "format": "f32-to-bf16",
3504
  "nbytes": 860160,
3505
  "byteOffset": 25470976
3506
  }
3507
  ],
3508
+ "md5sum": "037698a9234e2d563a950ced66a97bf3"
3509
  },
3510
  {
3511
  "dataPath": "params_shard_30.bin",
 
3529
  17920,
3530
  48
3531
  ],
3532
+ "dtype": "float32",
3533
  "format": "f32-to-bf16",
3534
  "nbytes": 1720320,
3535
  "byteOffset": 13762560
 
3539
  "shape": [
3540
  1536
3541
  ],
3542
+ "dtype": "float32",
3543
  "format": "f32-to-bf16",
3544
  "nbytes": 3072,
3545
  "byteOffset": 15482880
 
3549
  "shape": [
3550
  2048
3551
  ],
3552
+ "dtype": "float32",
3553
  "format": "f32-to-bf16",
3554
  "nbytes": 4096,
3555
  "byteOffset": 15485952
 
3571
  2048,
3572
  48
3573
  ],
3574
+ "dtype": "float32",
3575
  "format": "f32-to-bf16",
3576
  "nbytes": 196608,
3577
  "byteOffset": 17062912
 
3593
  1536,
3594
  48
3595
  ],
3596
+ "dtype": "float32",
3597
  "format": "f32-to-bf16",
3598
  "nbytes": 147456,
3599
  "byteOffset": 18439168
 
3603
  "shape": [
3604
  1536
3605
  ],
3606
+ "dtype": "float32",
3607
  "format": "f32-to-bf16",
3608
  "nbytes": 3072,
3609
  "byteOffset": 18586624
3610
  }
3611
  ],
3612
+ "md5sum": "e5c2ee400f5502dbba790e85967f0990"
3613
  }
3614
  ]
3615
  }
params_shard_0.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec4813c1c77b8d0d3d362848966ed3f6bec760c329a9b4024278758d97c1c36d
3
  size 116686848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4d1fa25bab93bdee27531e61adba6dc2caea6073c31a2fd544f63dda2b338af
3
  size 116686848
params_shard_1.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d27b68ff3b61089610d2431d3097a288ac8abbf6027012755013b280e4fb438f
3
  size 116686848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29ab837f64b3ac1937cbbe3dfd24c9958bc8208f9d3bf96e27c64164ba5ed5e7
3
  size 116686848
params_shard_10.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c434bf8c1a12c70f82cbfd1a1fd032c36062e0d0624ee854869a2918b95adcc
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b9804d09b1e919ed3b75a68ce2ee69ee3d710337b06af79a9bef033208ad4a3
3
  size 26331136
params_shard_11.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:658ee406da70e5f872ea5f93d749c2f23e68c68a6cc7ad63f855dc3f6e0639d1
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db2a5b10f92bf55dea115a922c3d0542a8f4d37a504a2decd7f96d9b67bf8dd5
3
  size 26331136
params_shard_12.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2970d7dd049a487bb1415cfd7ccc15bec06cea60a38a42c68e5886cfaa02643c
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24b30d6f4efacbf535ef4c4178e181ce6f9f1b68e9e5b60568afd1f534dbad91
3
  size 26331136
params_shard_13.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a014ab75a88523f552997270404aad87a746887ed9a3092c83b250594b7badc6
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30467c7f05df29c3117913518d89d634dea9a6d38b6c487a3b3e74d88fc3a583
3
  size 26331136
params_shard_14.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5cff56a70ee401359ff0f2cd9169d3abc8fff240ee42f713954cd959195fc786
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c066570bc414c818ed3a7ae2feefc9c154f83bb3e5a14eb134e409b2b03c353
3
  size 26331136
params_shard_15.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0df414862e8be0cf7ba70ebefc89eafb80108a492c5d2190ff16b523b651fbfa
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f86898b41c5670edf82e3afa5a91760c1b33d88b30e8fbd664a6e87ce42c4b
3
  size 26331136
params_shard_16.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:868cc2f94a7fa22126a155cc5e06b14fed5f95b83af00b736755b846c7b3ba13
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29c070a0392cf4a29855b381d126fa1dff21567162b0a9305fe7244a29060b21
3
  size 26331136
params_shard_17.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f73f777b8611905d18bae711f8f2a97a88f92f45aa21d8b6f05c3ebea3453135
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3f37453bfee2894fd2225c75bcecf3b8ac63a1a732b90c0f7a387c824812476
3
  size 26331136
params_shard_18.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd03d9b6d8d2dd9fbdcb490c798c544957bb9569e3e58bcb00a932795e2cd7f3
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f52432700ffb5c2506d6939133fc0e1366842bfc5b6398830498e0695ee7460e
3
  size 26331136
params_shard_19.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5eb39dac820c506c9c37ba3da690a88da7a2a48c5920deb096d4c7ee88371678
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3692ddfabe072c1376ed61209bcb42d2cb4f430ee01911cac98ad541212c7ad
3
  size 26331136
params_shard_2.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2c9ac194aa5ed68623826af040327a6ee43a8923d71eeced5a9554666dce213
3
  size 29174784
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0168a8b8f6459dad35d5fc9956219d31414b7ec246b3a019bfb29d92968c496e
3
  size 29174784
params_shard_20.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61fd3429478f1c85e5d9cdf34d37a3306fea8be8acdced8e2e407c16d910389b
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d30e8dc087c3801f92bf962d514c99b6e54e07e3cd4e726b371df4090c03f861
3
  size 26331136
params_shard_21.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:268247137646af01cad889dc6a12e229cfcf29d3ed9b96d0fe1850821e9362d1
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:befae26ea25cc5919bb9646fea6496b78e7100b836db9c52439fd5910cea3703
3
  size 26331136
params_shard_22.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31b1a3a86c5198b3e0b537f9f05d92ca3b22b5d6747ff4450e4413171289f549
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65c5c86b043d62bac22d6d7f591e345568eaffe9a0484f2abdaefac15cae57df
3
  size 26331136
params_shard_23.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c54e39305bea2b781d6e5c518ea81d9dfe05ccb1a19306d02250fb2411bb41ae
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00b663c5bb64030d233a6f0c449fa5343c61b036e432d1d6928544cd85b49b7f
3
  size 26331136
params_shard_24.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:879358a57f9e2e8c15645afe76147f6f668769e2b02d33193f480de0acd80b47
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:677d1df1179512e30f372dc91f90684ee0af2ad0e3a4f63094f2a73ba6221b05
3
  size 26331136
params_shard_25.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b9d831dacea12adda34c79bcfc061574093e64290fd8fada3726f5c1efd8b77
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83d0ff8801ee8dce27cf701d7d2362672e1bb5f740ef7b38b74018fa42e6c129
3
  size 26331136
params_shard_26.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8607e8b3fe2ce80d0825e2dd4035e26318166bf487c2e062c792f5e2001192e4
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:616c37ad221a4b3d79b8bdad4e204507469e858a7724ab1d5da293134b21eca4
3
  size 26331136
params_shard_27.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01e21acdb9f3a722227431e258fd7b3aae74eea80ba10e9ebe78c9ca6b37bdd5
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fae875a6701fb126172d6b67d46269c97c3a58902143dd5c2f3b5f17f41a08dc
3
  size 26331136
params_shard_28.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75b01f6c5daf9e775d5c50e75d4cd99d10ddf9e0a5458e0f602630161bea7085
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9f0b0eeee4dcbfe3b1bafbe1d006a8203ebc43c15b8a17a6694d7a588d203c0
3
  size 26331136
params_shard_29.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:018f365ae1584512127502951877098287ac39f5ad7856e2eea263ad4f4262c6
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70694802b48fa31110c5b12bfb64c3f8d93dedc0c835197c72dad01026b92d54
3
  size 26331136
params_shard_3.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:807993187284a5a883cd20f80a113c25c5fde13d69606d526dcd0448cba20f82
3
  size 33212416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3340731366f5eef347332610f751ebb53a41d6c6058294f867daa6e7f09a3f14
3
  size 33212416
params_shard_30.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd225141d3e031ab77600c180cedc8c5ae3854b8fc584236a5317f12c0be380c
3
  size 18589696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86074eb00eb1ba19a4b9843af5d0921f40a0ea0465a23683365ad97da549e0e5
3
  size 18589696
params_shard_4.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eeda98d75827843b164b71597c17f33c833e859914017510728e9834505aa273
3
  size 27191296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35c1be0353e94b955b7d6b2040984634eaf25bfd184c2d97fc2ed23e37e83048
3
  size 27191296
params_shard_5.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9abf5d9053c11f6ad700d6f7572dad2832c9f579d6f217e0998a9a6e4aed4e2
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03a0ce57941633fa5f6a2e1d8faae013278e1fd22caf5d029cf0686da836a3ec
3
  size 26331136
params_shard_6.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4cd6910039baad6fce4467956a5179ca074e609dbcbebfe7261701ecf4a377a
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcea40b18bd7ef899c2aff644d66770baa7000e8fd5659ab28941d5e2bb2cc80
3
  size 26331136
params_shard_7.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:904b9b0c57e91b88a96c4aa7f8b47d80ec7f1ba2d0313743b85268b2c7a747ec
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:720ad30c2c64af45206f7c52a25091a5b35b463d0d86a31d584dbf525eabbe27
3
  size 26331136
params_shard_8.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:141a631925d702b7e681421c972908c707e0a544095a412547eacb68eb4c2de9
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d71409e44c67ea5ff80283a9cdc44e72d2b14bcc1977991fe1a36e7d981e3f09
3
  size 26331136
params_shard_9.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab485e831ccc43b7e10b2d0fc6880327ec14c9350c9d9157e8d54664c5871b3f
3
  size 26331136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65d2fac827f0f40496b8ea02ff1e9d560d1fe01e69b4d60156889d9cd38a75fd
3
  size 26331136