navodPeiris commited on
Commit
816872c
1 Parent(s): 58f4330
Files changed (1) hide show
  1. model.safetensors.index.json +2 -1765
model.safetensors.index.json CHANGED
@@ -1,1769 +1,6 @@
1
  {
2
- "index": {
3
- "lm_head.weight": {
4
- "dtype": "torch.bfloat16",
5
- "shape": [
6
- 32000,
7
- 2048
8
- ],
9
- "offset": 0,
10
- "length": 131072000
11
- },
12
- "model.embed_tokens.weight": {
13
- "dtype": "torch.bfloat16",
14
- "shape": [
15
- 32000,
16
- 2048
17
- ],
18
- "offset": 0,
19
- "length": 131072000
20
- },
21
- "model.layers.0.input_layernorm.weight": {
22
- "dtype": "torch.bfloat16",
23
- "shape": [
24
- 2048
25
- ],
26
- "offset": 0,
27
- "length": 4096
28
- },
29
- "model.layers.0.mlp.down_proj.weight": {
30
- "dtype": "torch.bfloat16",
31
- "shape": [
32
- 2048,
33
- 5632
34
- ],
35
- "offset": 0,
36
- "length": 23068672
37
- },
38
- "model.layers.0.mlp.gate_proj.weight": {
39
- "dtype": "torch.bfloat16",
40
- "shape": [
41
- 5632,
42
- 2048
43
- ],
44
- "offset": 0,
45
- "length": 23068672
46
- },
47
- "model.layers.0.mlp.up_proj.weight": {
48
- "dtype": "torch.bfloat16",
49
- "shape": [
50
- 5632,
51
- 2048
52
- ],
53
- "offset": 0,
54
- "length": 23068672
55
- },
56
- "model.layers.0.post_attention_layernorm.weight": {
57
- "dtype": "torch.bfloat16",
58
- "shape": [
59
- 2048
60
- ],
61
- "offset": 0,
62
- "length": 4096
63
- },
64
- "model.layers.0.self_attn.k_proj.weight": {
65
- "dtype": "torch.bfloat16",
66
- "shape": [
67
- 256,
68
- 2048
69
- ],
70
- "offset": 0,
71
- "length": 1048576
72
- },
73
- "model.layers.0.self_attn.o_proj.weight": {
74
- "dtype": "torch.bfloat16",
75
- "shape": [
76
- 2048,
77
- 2048
78
- ],
79
- "offset": 0,
80
- "length": 8388608
81
- },
82
- "model.layers.0.self_attn.q_proj.weight": {
83
- "dtype": "torch.bfloat16",
84
- "shape": [
85
- 2048,
86
- 2048
87
- ],
88
- "offset": 0,
89
- "length": 8388608
90
- },
91
- "model.layers.0.self_attn.v_proj.weight": {
92
- "dtype": "torch.bfloat16",
93
- "shape": [
94
- 256,
95
- 2048
96
- ],
97
- "offset": 0,
98
- "length": 1048576
99
- },
100
- "model.layers.1.input_layernorm.weight": {
101
- "dtype": "torch.bfloat16",
102
- "shape": [
103
- 2048
104
- ],
105
- "offset": 0,
106
- "length": 4096
107
- },
108
- "model.layers.1.mlp.down_proj.weight": {
109
- "dtype": "torch.bfloat16",
110
- "shape": [
111
- 2048,
112
- 5632
113
- ],
114
- "offset": 0,
115
- "length": 23068672
116
- },
117
- "model.layers.1.mlp.gate_proj.weight": {
118
- "dtype": "torch.bfloat16",
119
- "shape": [
120
- 5632,
121
- 2048
122
- ],
123
- "offset": 0,
124
- "length": 23068672
125
- },
126
- "model.layers.1.mlp.up_proj.weight": {
127
- "dtype": "torch.bfloat16",
128
- "shape": [
129
- 5632,
130
- 2048
131
- ],
132
- "offset": 0,
133
- "length": 23068672
134
- },
135
- "model.layers.1.post_attention_layernorm.weight": {
136
- "dtype": "torch.bfloat16",
137
- "shape": [
138
- 2048
139
- ],
140
- "offset": 0,
141
- "length": 4096
142
- },
143
- "model.layers.1.self_attn.k_proj.weight": {
144
- "dtype": "torch.bfloat16",
145
- "shape": [
146
- 256,
147
- 2048
148
- ],
149
- "offset": 0,
150
- "length": 1048576
151
- },
152
- "model.layers.1.self_attn.o_proj.weight": {
153
- "dtype": "torch.bfloat16",
154
- "shape": [
155
- 2048,
156
- 2048
157
- ],
158
- "offset": 0,
159
- "length": 8388608
160
- },
161
- "model.layers.1.self_attn.q_proj.weight": {
162
- "dtype": "torch.bfloat16",
163
- "shape": [
164
- 2048,
165
- 2048
166
- ],
167
- "offset": 0,
168
- "length": 8388608
169
- },
170
- "model.layers.1.self_attn.v_proj.weight": {
171
- "dtype": "torch.bfloat16",
172
- "shape": [
173
- 256,
174
- 2048
175
- ],
176
- "offset": 0,
177
- "length": 1048576
178
- },
179
- "model.layers.10.input_layernorm.weight": {
180
- "dtype": "torch.bfloat16",
181
- "shape": [
182
- 2048
183
- ],
184
- "offset": 0,
185
- "length": 4096
186
- },
187
- "model.layers.10.mlp.down_proj.weight": {
188
- "dtype": "torch.bfloat16",
189
- "shape": [
190
- 2048,
191
- 5632
192
- ],
193
- "offset": 0,
194
- "length": 23068672
195
- },
196
- "model.layers.10.mlp.gate_proj.weight": {
197
- "dtype": "torch.bfloat16",
198
- "shape": [
199
- 5632,
200
- 2048
201
- ],
202
- "offset": 0,
203
- "length": 23068672
204
- },
205
- "model.layers.10.mlp.up_proj.weight": {
206
- "dtype": "torch.bfloat16",
207
- "shape": [
208
- 5632,
209
- 2048
210
- ],
211
- "offset": 0,
212
- "length": 23068672
213
- },
214
- "model.layers.10.post_attention_layernorm.weight": {
215
- "dtype": "torch.bfloat16",
216
- "shape": [
217
- 2048
218
- ],
219
- "offset": 0,
220
- "length": 4096
221
- },
222
- "model.layers.10.self_attn.k_proj.weight": {
223
- "dtype": "torch.bfloat16",
224
- "shape": [
225
- 256,
226
- 2048
227
- ],
228
- "offset": 0,
229
- "length": 1048576
230
- },
231
- "model.layers.10.self_attn.o_proj.weight": {
232
- "dtype": "torch.bfloat16",
233
- "shape": [
234
- 2048,
235
- 2048
236
- ],
237
- "offset": 0,
238
- "length": 8388608
239
- },
240
- "model.layers.10.self_attn.q_proj.weight": {
241
- "dtype": "torch.bfloat16",
242
- "shape": [
243
- 2048,
244
- 2048
245
- ],
246
- "offset": 0,
247
- "length": 8388608
248
- },
249
- "model.layers.10.self_attn.v_proj.weight": {
250
- "dtype": "torch.bfloat16",
251
- "shape": [
252
- 256,
253
- 2048
254
- ],
255
- "offset": 0,
256
- "length": 1048576
257
- },
258
- "model.layers.11.input_layernorm.weight": {
259
- "dtype": "torch.bfloat16",
260
- "shape": [
261
- 2048
262
- ],
263
- "offset": 0,
264
- "length": 4096
265
- },
266
- "model.layers.11.mlp.down_proj.weight": {
267
- "dtype": "torch.bfloat16",
268
- "shape": [
269
- 2048,
270
- 5632
271
- ],
272
- "offset": 0,
273
- "length": 23068672
274
- },
275
- "model.layers.11.mlp.gate_proj.weight": {
276
- "dtype": "torch.bfloat16",
277
- "shape": [
278
- 5632,
279
- 2048
280
- ],
281
- "offset": 0,
282
- "length": 23068672
283
- },
284
- "model.layers.11.mlp.up_proj.weight": {
285
- "dtype": "torch.bfloat16",
286
- "shape": [
287
- 5632,
288
- 2048
289
- ],
290
- "offset": 0,
291
- "length": 23068672
292
- },
293
- "model.layers.11.post_attention_layernorm.weight": {
294
- "dtype": "torch.bfloat16",
295
- "shape": [
296
- 2048
297
- ],
298
- "offset": 0,
299
- "length": 4096
300
- },
301
- "model.layers.11.self_attn.k_proj.weight": {
302
- "dtype": "torch.bfloat16",
303
- "shape": [
304
- 256,
305
- 2048
306
- ],
307
- "offset": 0,
308
- "length": 1048576
309
- },
310
- "model.layers.11.self_attn.o_proj.weight": {
311
- "dtype": "torch.bfloat16",
312
- "shape": [
313
- 2048,
314
- 2048
315
- ],
316
- "offset": 0,
317
- "length": 8388608
318
- },
319
- "model.layers.11.self_attn.q_proj.weight": {
320
- "dtype": "torch.bfloat16",
321
- "shape": [
322
- 2048,
323
- 2048
324
- ],
325
- "offset": 0,
326
- "length": 8388608
327
- },
328
- "model.layers.11.self_attn.v_proj.weight": {
329
- "dtype": "torch.bfloat16",
330
- "shape": [
331
- 256,
332
- 2048
333
- ],
334
- "offset": 0,
335
- "length": 1048576
336
- },
337
- "model.layers.12.input_layernorm.weight": {
338
- "dtype": "torch.bfloat16",
339
- "shape": [
340
- 2048
341
- ],
342
- "offset": 0,
343
- "length": 4096
344
- },
345
- "model.layers.12.mlp.down_proj.weight": {
346
- "dtype": "torch.bfloat16",
347
- "shape": [
348
- 2048,
349
- 5632
350
- ],
351
- "offset": 0,
352
- "length": 23068672
353
- },
354
- "model.layers.12.mlp.gate_proj.weight": {
355
- "dtype": "torch.bfloat16",
356
- "shape": [
357
- 5632,
358
- 2048
359
- ],
360
- "offset": 0,
361
- "length": 23068672
362
- },
363
- "model.layers.12.mlp.up_proj.weight": {
364
- "dtype": "torch.bfloat16",
365
- "shape": [
366
- 5632,
367
- 2048
368
- ],
369
- "offset": 0,
370
- "length": 23068672
371
- },
372
- "model.layers.12.post_attention_layernorm.weight": {
373
- "dtype": "torch.bfloat16",
374
- "shape": [
375
- 2048
376
- ],
377
- "offset": 0,
378
- "length": 4096
379
- },
380
- "model.layers.12.self_attn.k_proj.weight": {
381
- "dtype": "torch.bfloat16",
382
- "shape": [
383
- 256,
384
- 2048
385
- ],
386
- "offset": 0,
387
- "length": 1048576
388
- },
389
- "model.layers.12.self_attn.o_proj.weight": {
390
- "dtype": "torch.bfloat16",
391
- "shape": [
392
- 2048,
393
- 2048
394
- ],
395
- "offset": 0,
396
- "length": 8388608
397
- },
398
- "model.layers.12.self_attn.q_proj.weight": {
399
- "dtype": "torch.bfloat16",
400
- "shape": [
401
- 2048,
402
- 2048
403
- ],
404
- "offset": 0,
405
- "length": 8388608
406
- },
407
- "model.layers.12.self_attn.v_proj.weight": {
408
- "dtype": "torch.bfloat16",
409
- "shape": [
410
- 256,
411
- 2048
412
- ],
413
- "offset": 0,
414
- "length": 1048576
415
- },
416
- "model.layers.13.input_layernorm.weight": {
417
- "dtype": "torch.bfloat16",
418
- "shape": [
419
- 2048
420
- ],
421
- "offset": 0,
422
- "length": 4096
423
- },
424
- "model.layers.13.mlp.down_proj.weight": {
425
- "dtype": "torch.bfloat16",
426
- "shape": [
427
- 2048,
428
- 5632
429
- ],
430
- "offset": 0,
431
- "length": 23068672
432
- },
433
- "model.layers.13.mlp.gate_proj.weight": {
434
- "dtype": "torch.bfloat16",
435
- "shape": [
436
- 5632,
437
- 2048
438
- ],
439
- "offset": 0,
440
- "length": 23068672
441
- },
442
- "model.layers.13.mlp.up_proj.weight": {
443
- "dtype": "torch.bfloat16",
444
- "shape": [
445
- 5632,
446
- 2048
447
- ],
448
- "offset": 0,
449
- "length": 23068672
450
- },
451
- "model.layers.13.post_attention_layernorm.weight": {
452
- "dtype": "torch.bfloat16",
453
- "shape": [
454
- 2048
455
- ],
456
- "offset": 0,
457
- "length": 4096
458
- },
459
- "model.layers.13.self_attn.k_proj.weight": {
460
- "dtype": "torch.bfloat16",
461
- "shape": [
462
- 256,
463
- 2048
464
- ],
465
- "offset": 0,
466
- "length": 1048576
467
- },
468
- "model.layers.13.self_attn.o_proj.weight": {
469
- "dtype": "torch.bfloat16",
470
- "shape": [
471
- 2048,
472
- 2048
473
- ],
474
- "offset": 0,
475
- "length": 8388608
476
- },
477
- "model.layers.13.self_attn.q_proj.weight": {
478
- "dtype": "torch.bfloat16",
479
- "shape": [
480
- 2048,
481
- 2048
482
- ],
483
- "offset": 0,
484
- "length": 8388608
485
- },
486
- "model.layers.13.self_attn.v_proj.weight": {
487
- "dtype": "torch.bfloat16",
488
- "shape": [
489
- 256,
490
- 2048
491
- ],
492
- "offset": 0,
493
- "length": 1048576
494
- },
495
- "model.layers.14.input_layernorm.weight": {
496
- "dtype": "torch.bfloat16",
497
- "shape": [
498
- 2048
499
- ],
500
- "offset": 0,
501
- "length": 4096
502
- },
503
- "model.layers.14.mlp.down_proj.weight": {
504
- "dtype": "torch.bfloat16",
505
- "shape": [
506
- 2048,
507
- 5632
508
- ],
509
- "offset": 0,
510
- "length": 23068672
511
- },
512
- "model.layers.14.mlp.gate_proj.weight": {
513
- "dtype": "torch.bfloat16",
514
- "shape": [
515
- 5632,
516
- 2048
517
- ],
518
- "offset": 0,
519
- "length": 23068672
520
- },
521
- "model.layers.14.mlp.up_proj.weight": {
522
- "dtype": "torch.bfloat16",
523
- "shape": [
524
- 5632,
525
- 2048
526
- ],
527
- "offset": 0,
528
- "length": 23068672
529
- },
530
- "model.layers.14.post_attention_layernorm.weight": {
531
- "dtype": "torch.bfloat16",
532
- "shape": [
533
- 2048
534
- ],
535
- "offset": 0,
536
- "length": 4096
537
- },
538
- "model.layers.14.self_attn.k_proj.weight": {
539
- "dtype": "torch.bfloat16",
540
- "shape": [
541
- 256,
542
- 2048
543
- ],
544
- "offset": 0,
545
- "length": 1048576
546
- },
547
- "model.layers.14.self_attn.o_proj.weight": {
548
- "dtype": "torch.bfloat16",
549
- "shape": [
550
- 2048,
551
- 2048
552
- ],
553
- "offset": 0,
554
- "length": 8388608
555
- },
556
- "model.layers.14.self_attn.q_proj.weight": {
557
- "dtype": "torch.bfloat16",
558
- "shape": [
559
- 2048,
560
- 2048
561
- ],
562
- "offset": 0,
563
- "length": 8388608
564
- },
565
- "model.layers.14.self_attn.v_proj.weight": {
566
- "dtype": "torch.bfloat16",
567
- "shape": [
568
- 256,
569
- 2048
570
- ],
571
- "offset": 0,
572
- "length": 1048576
573
- },
574
- "model.layers.15.input_layernorm.weight": {
575
- "dtype": "torch.bfloat16",
576
- "shape": [
577
- 2048
578
- ],
579
- "offset": 0,
580
- "length": 4096
581
- },
582
- "model.layers.15.mlp.down_proj.weight": {
583
- "dtype": "torch.bfloat16",
584
- "shape": [
585
- 2048,
586
- 5632
587
- ],
588
- "offset": 0,
589
- "length": 23068672
590
- },
591
- "model.layers.15.mlp.gate_proj.weight": {
592
- "dtype": "torch.bfloat16",
593
- "shape": [
594
- 5632,
595
- 2048
596
- ],
597
- "offset": 0,
598
- "length": 23068672
599
- },
600
- "model.layers.15.mlp.up_proj.weight": {
601
- "dtype": "torch.bfloat16",
602
- "shape": [
603
- 5632,
604
- 2048
605
- ],
606
- "offset": 0,
607
- "length": 23068672
608
- },
609
- "model.layers.15.post_attention_layernorm.weight": {
610
- "dtype": "torch.bfloat16",
611
- "shape": [
612
- 2048
613
- ],
614
- "offset": 0,
615
- "length": 4096
616
- },
617
- "model.layers.15.self_attn.k_proj.weight": {
618
- "dtype": "torch.bfloat16",
619
- "shape": [
620
- 256,
621
- 2048
622
- ],
623
- "offset": 0,
624
- "length": 1048576
625
- },
626
- "model.layers.15.self_attn.o_proj.weight": {
627
- "dtype": "torch.bfloat16",
628
- "shape": [
629
- 2048,
630
- 2048
631
- ],
632
- "offset": 0,
633
- "length": 8388608
634
- },
635
- "model.layers.15.self_attn.q_proj.weight": {
636
- "dtype": "torch.bfloat16",
637
- "shape": [
638
- 2048,
639
- 2048
640
- ],
641
- "offset": 0,
642
- "length": 8388608
643
- },
644
- "model.layers.15.self_attn.v_proj.weight": {
645
- "dtype": "torch.bfloat16",
646
- "shape": [
647
- 256,
648
- 2048
649
- ],
650
- "offset": 0,
651
- "length": 1048576
652
- },
653
- "model.layers.16.input_layernorm.weight": {
654
- "dtype": "torch.bfloat16",
655
- "shape": [
656
- 2048
657
- ],
658
- "offset": 0,
659
- "length": 4096
660
- },
661
- "model.layers.16.mlp.down_proj.weight": {
662
- "dtype": "torch.bfloat16",
663
- "shape": [
664
- 2048,
665
- 5632
666
- ],
667
- "offset": 0,
668
- "length": 23068672
669
- },
670
- "model.layers.16.mlp.gate_proj.weight": {
671
- "dtype": "torch.bfloat16",
672
- "shape": [
673
- 5632,
674
- 2048
675
- ],
676
- "offset": 0,
677
- "length": 23068672
678
- },
679
- "model.layers.16.mlp.up_proj.weight": {
680
- "dtype": "torch.bfloat16",
681
- "shape": [
682
- 5632,
683
- 2048
684
- ],
685
- "offset": 0,
686
- "length": 23068672
687
- },
688
- "model.layers.16.post_attention_layernorm.weight": {
689
- "dtype": "torch.bfloat16",
690
- "shape": [
691
- 2048
692
- ],
693
- "offset": 0,
694
- "length": 4096
695
- },
696
- "model.layers.16.self_attn.k_proj.weight": {
697
- "dtype": "torch.bfloat16",
698
- "shape": [
699
- 256,
700
- 2048
701
- ],
702
- "offset": 0,
703
- "length": 1048576
704
- },
705
- "model.layers.16.self_attn.o_proj.weight": {
706
- "dtype": "torch.bfloat16",
707
- "shape": [
708
- 2048,
709
- 2048
710
- ],
711
- "offset": 0,
712
- "length": 8388608
713
- },
714
- "model.layers.16.self_attn.q_proj.weight": {
715
- "dtype": "torch.bfloat16",
716
- "shape": [
717
- 2048,
718
- 2048
719
- ],
720
- "offset": 0,
721
- "length": 8388608
722
- },
723
- "model.layers.16.self_attn.v_proj.weight": {
724
- "dtype": "torch.bfloat16",
725
- "shape": [
726
- 256,
727
- 2048
728
- ],
729
- "offset": 0,
730
- "length": 1048576
731
- },
732
- "model.layers.17.input_layernorm.weight": {
733
- "dtype": "torch.bfloat16",
734
- "shape": [
735
- 2048
736
- ],
737
- "offset": 0,
738
- "length": 4096
739
- },
740
- "model.layers.17.mlp.down_proj.weight": {
741
- "dtype": "torch.bfloat16",
742
- "shape": [
743
- 2048,
744
- 5632
745
- ],
746
- "offset": 0,
747
- "length": 23068672
748
- },
749
- "model.layers.17.mlp.gate_proj.weight": {
750
- "dtype": "torch.bfloat16",
751
- "shape": [
752
- 5632,
753
- 2048
754
- ],
755
- "offset": 0,
756
- "length": 23068672
757
- },
758
- "model.layers.17.mlp.up_proj.weight": {
759
- "dtype": "torch.bfloat16",
760
- "shape": [
761
- 5632,
762
- 2048
763
- ],
764
- "offset": 0,
765
- "length": 23068672
766
- },
767
- "model.layers.17.post_attention_layernorm.weight": {
768
- "dtype": "torch.bfloat16",
769
- "shape": [
770
- 2048
771
- ],
772
- "offset": 0,
773
- "length": 4096
774
- },
775
- "model.layers.17.self_attn.k_proj.weight": {
776
- "dtype": "torch.bfloat16",
777
- "shape": [
778
- 256,
779
- 2048
780
- ],
781
- "offset": 0,
782
- "length": 1048576
783
- },
784
- "model.layers.17.self_attn.o_proj.weight": {
785
- "dtype": "torch.bfloat16",
786
- "shape": [
787
- 2048,
788
- 2048
789
- ],
790
- "offset": 0,
791
- "length": 8388608
792
- },
793
- "model.layers.17.self_attn.q_proj.weight": {
794
- "dtype": "torch.bfloat16",
795
- "shape": [
796
- 2048,
797
- 2048
798
- ],
799
- "offset": 0,
800
- "length": 8388608
801
- },
802
- "model.layers.17.self_attn.v_proj.weight": {
803
- "dtype": "torch.bfloat16",
804
- "shape": [
805
- 256,
806
- 2048
807
- ],
808
- "offset": 0,
809
- "length": 1048576
810
- },
811
- "model.layers.18.input_layernorm.weight": {
812
- "dtype": "torch.bfloat16",
813
- "shape": [
814
- 2048
815
- ],
816
- "offset": 0,
817
- "length": 4096
818
- },
819
- "model.layers.18.mlp.down_proj.weight": {
820
- "dtype": "torch.bfloat16",
821
- "shape": [
822
- 2048,
823
- 5632
824
- ],
825
- "offset": 0,
826
- "length": 23068672
827
- },
828
- "model.layers.18.mlp.gate_proj.weight": {
829
- "dtype": "torch.bfloat16",
830
- "shape": [
831
- 5632,
832
- 2048
833
- ],
834
- "offset": 0,
835
- "length": 23068672
836
- },
837
- "model.layers.18.mlp.up_proj.weight": {
838
- "dtype": "torch.bfloat16",
839
- "shape": [
840
- 5632,
841
- 2048
842
- ],
843
- "offset": 0,
844
- "length": 23068672
845
- },
846
- "model.layers.18.post_attention_layernorm.weight": {
847
- "dtype": "torch.bfloat16",
848
- "shape": [
849
- 2048
850
- ],
851
- "offset": 0,
852
- "length": 4096
853
- },
854
- "model.layers.18.self_attn.k_proj.weight": {
855
- "dtype": "torch.bfloat16",
856
- "shape": [
857
- 256,
858
- 2048
859
- ],
860
- "offset": 0,
861
- "length": 1048576
862
- },
863
- "model.layers.18.self_attn.o_proj.weight": {
864
- "dtype": "torch.bfloat16",
865
- "shape": [
866
- 2048,
867
- 2048
868
- ],
869
- "offset": 0,
870
- "length": 8388608
871
- },
872
- "model.layers.18.self_attn.q_proj.weight": {
873
- "dtype": "torch.bfloat16",
874
- "shape": [
875
- 2048,
876
- 2048
877
- ],
878
- "offset": 0,
879
- "length": 8388608
880
- },
881
- "model.layers.18.self_attn.v_proj.weight": {
882
- "dtype": "torch.bfloat16",
883
- "shape": [
884
- 256,
885
- 2048
886
- ],
887
- "offset": 0,
888
- "length": 1048576
889
- },
890
- "model.layers.19.input_layernorm.weight": {
891
- "dtype": "torch.bfloat16",
892
- "shape": [
893
- 2048
894
- ],
895
- "offset": 0,
896
- "length": 4096
897
- },
898
- "model.layers.19.mlp.down_proj.weight": {
899
- "dtype": "torch.bfloat16",
900
- "shape": [
901
- 2048,
902
- 5632
903
- ],
904
- "offset": 0,
905
- "length": 23068672
906
- },
907
- "model.layers.19.mlp.gate_proj.weight": {
908
- "dtype": "torch.bfloat16",
909
- "shape": [
910
- 5632,
911
- 2048
912
- ],
913
- "offset": 0,
914
- "length": 23068672
915
- },
916
- "model.layers.19.mlp.up_proj.weight": {
917
- "dtype": "torch.bfloat16",
918
- "shape": [
919
- 5632,
920
- 2048
921
- ],
922
- "offset": 0,
923
- "length": 23068672
924
- },
925
- "model.layers.19.post_attention_layernorm.weight": {
926
- "dtype": "torch.bfloat16",
927
- "shape": [
928
- 2048
929
- ],
930
- "offset": 0,
931
- "length": 4096
932
- },
933
- "model.layers.19.self_attn.k_proj.weight": {
934
- "dtype": "torch.bfloat16",
935
- "shape": [
936
- 256,
937
- 2048
938
- ],
939
- "offset": 0,
940
- "length": 1048576
941
- },
942
- "model.layers.19.self_attn.o_proj.weight": {
943
- "dtype": "torch.bfloat16",
944
- "shape": [
945
- 2048,
946
- 2048
947
- ],
948
- "offset": 0,
949
- "length": 8388608
950
- },
951
- "model.layers.19.self_attn.q_proj.weight": {
952
- "dtype": "torch.bfloat16",
953
- "shape": [
954
- 2048,
955
- 2048
956
- ],
957
- "offset": 0,
958
- "length": 8388608
959
- },
960
- "model.layers.19.self_attn.v_proj.weight": {
961
- "dtype": "torch.bfloat16",
962
- "shape": [
963
- 256,
964
- 2048
965
- ],
966
- "offset": 0,
967
- "length": 1048576
968
- },
969
- "model.layers.2.input_layernorm.weight": {
970
- "dtype": "torch.bfloat16",
971
- "shape": [
972
- 2048
973
- ],
974
- "offset": 0,
975
- "length": 4096
976
- },
977
- "model.layers.2.mlp.down_proj.weight": {
978
- "dtype": "torch.bfloat16",
979
- "shape": [
980
- 2048,
981
- 5632
982
- ],
983
- "offset": 0,
984
- "length": 23068672
985
- },
986
- "model.layers.2.mlp.gate_proj.weight": {
987
- "dtype": "torch.bfloat16",
988
- "shape": [
989
- 5632,
990
- 2048
991
- ],
992
- "offset": 0,
993
- "length": 23068672
994
- },
995
- "model.layers.2.mlp.up_proj.weight": {
996
- "dtype": "torch.bfloat16",
997
- "shape": [
998
- 5632,
999
- 2048
1000
- ],
1001
- "offset": 0,
1002
- "length": 23068672
1003
- },
1004
- "model.layers.2.post_attention_layernorm.weight": {
1005
- "dtype": "torch.bfloat16",
1006
- "shape": [
1007
- 2048
1008
- ],
1009
- "offset": 0,
1010
- "length": 4096
1011
- },
1012
- "model.layers.2.self_attn.k_proj.weight": {
1013
- "dtype": "torch.bfloat16",
1014
- "shape": [
1015
- 256,
1016
- 2048
1017
- ],
1018
- "offset": 0,
1019
- "length": 1048576
1020
- },
1021
- "model.layers.2.self_attn.o_proj.weight": {
1022
- "dtype": "torch.bfloat16",
1023
- "shape": [
1024
- 2048,
1025
- 2048
1026
- ],
1027
- "offset": 0,
1028
- "length": 8388608
1029
- },
1030
- "model.layers.2.self_attn.q_proj.weight": {
1031
- "dtype": "torch.bfloat16",
1032
- "shape": [
1033
- 2048,
1034
- 2048
1035
- ],
1036
- "offset": 0,
1037
- "length": 8388608
1038
- },
1039
- "model.layers.2.self_attn.v_proj.weight": {
1040
- "dtype": "torch.bfloat16",
1041
- "shape": [
1042
- 256,
1043
- 2048
1044
- ],
1045
- "offset": 0,
1046
- "length": 1048576
1047
- },
1048
- "model.layers.20.input_layernorm.weight": {
1049
- "dtype": "torch.bfloat16",
1050
- "shape": [
1051
- 2048
1052
- ],
1053
- "offset": 0,
1054
- "length": 4096
1055
- },
1056
- "model.layers.20.mlp.down_proj.weight": {
1057
- "dtype": "torch.bfloat16",
1058
- "shape": [
1059
- 2048,
1060
- 5632
1061
- ],
1062
- "offset": 0,
1063
- "length": 23068672
1064
- },
1065
- "model.layers.20.mlp.gate_proj.weight": {
1066
- "dtype": "torch.bfloat16",
1067
- "shape": [
1068
- 5632,
1069
- 2048
1070
- ],
1071
- "offset": 0,
1072
- "length": 23068672
1073
- },
1074
- "model.layers.20.mlp.up_proj.weight": {
1075
- "dtype": "torch.bfloat16",
1076
- "shape": [
1077
- 5632,
1078
- 2048
1079
- ],
1080
- "offset": 0,
1081
- "length": 23068672
1082
- },
1083
- "model.layers.20.post_attention_layernorm.weight": {
1084
- "dtype": "torch.bfloat16",
1085
- "shape": [
1086
- 2048
1087
- ],
1088
- "offset": 0,
1089
- "length": 4096
1090
- },
1091
- "model.layers.20.self_attn.k_proj.weight": {
1092
- "dtype": "torch.bfloat16",
1093
- "shape": [
1094
- 256,
1095
- 2048
1096
- ],
1097
- "offset": 0,
1098
- "length": 1048576
1099
- },
1100
- "model.layers.20.self_attn.o_proj.weight": {
1101
- "dtype": "torch.bfloat16",
1102
- "shape": [
1103
- 2048,
1104
- 2048
1105
- ],
1106
- "offset": 0,
1107
- "length": 8388608
1108
- },
1109
- "model.layers.20.self_attn.q_proj.weight": {
1110
- "dtype": "torch.bfloat16",
1111
- "shape": [
1112
- 2048,
1113
- 2048
1114
- ],
1115
- "offset": 0,
1116
- "length": 8388608
1117
- },
1118
- "model.layers.20.self_attn.v_proj.weight": {
1119
- "dtype": "torch.bfloat16",
1120
- "shape": [
1121
- 256,
1122
- 2048
1123
- ],
1124
- "offset": 0,
1125
- "length": 1048576
1126
- },
1127
- "model.layers.21.input_layernorm.weight": {
1128
- "dtype": "torch.bfloat16",
1129
- "shape": [
1130
- 2048
1131
- ],
1132
- "offset": 0,
1133
- "length": 4096
1134
- },
1135
- "model.layers.21.mlp.down_proj.weight": {
1136
- "dtype": "torch.bfloat16",
1137
- "shape": [
1138
- 2048,
1139
- 5632
1140
- ],
1141
- "offset": 0,
1142
- "length": 23068672
1143
- },
1144
- "model.layers.21.mlp.gate_proj.weight": {
1145
- "dtype": "torch.bfloat16",
1146
- "shape": [
1147
- 5632,
1148
- 2048
1149
- ],
1150
- "offset": 0,
1151
- "length": 23068672
1152
- },
1153
- "model.layers.21.mlp.up_proj.weight": {
1154
- "dtype": "torch.bfloat16",
1155
- "shape": [
1156
- 5632,
1157
- 2048
1158
- ],
1159
- "offset": 0,
1160
- "length": 23068672
1161
- },
1162
- "model.layers.21.post_attention_layernorm.weight": {
1163
- "dtype": "torch.bfloat16",
1164
- "shape": [
1165
- 2048
1166
- ],
1167
- "offset": 0,
1168
- "length": 4096
1169
- },
1170
- "model.layers.21.self_attn.k_proj.weight": {
1171
- "dtype": "torch.bfloat16",
1172
- "shape": [
1173
- 256,
1174
- 2048
1175
- ],
1176
- "offset": 0,
1177
- "length": 1048576
1178
- },
1179
- "model.layers.21.self_attn.o_proj.weight": {
1180
- "dtype": "torch.bfloat16",
1181
- "shape": [
1182
- 2048,
1183
- 2048
1184
- ],
1185
- "offset": 0,
1186
- "length": 8388608
1187
- },
1188
- "model.layers.21.self_attn.q_proj.weight": {
1189
- "dtype": "torch.bfloat16",
1190
- "shape": [
1191
- 2048,
1192
- 2048
1193
- ],
1194
- "offset": 0,
1195
- "length": 8388608
1196
- },
1197
- "model.layers.21.self_attn.v_proj.weight": {
1198
- "dtype": "torch.bfloat16",
1199
- "shape": [
1200
- 256,
1201
- 2048
1202
- ],
1203
- "offset": 0,
1204
- "length": 1048576
1205
- },
1206
- "model.layers.3.input_layernorm.weight": {
1207
- "dtype": "torch.bfloat16",
1208
- "shape": [
1209
- 2048
1210
- ],
1211
- "offset": 0,
1212
- "length": 4096
1213
- },
1214
- "model.layers.3.mlp.down_proj.weight": {
1215
- "dtype": "torch.bfloat16",
1216
- "shape": [
1217
- 2048,
1218
- 5632
1219
- ],
1220
- "offset": 0,
1221
- "length": 23068672
1222
- },
1223
- "model.layers.3.mlp.gate_proj.weight": {
1224
- "dtype": "torch.bfloat16",
1225
- "shape": [
1226
- 5632,
1227
- 2048
1228
- ],
1229
- "offset": 0,
1230
- "length": 23068672
1231
- },
1232
- "model.layers.3.mlp.up_proj.weight": {
1233
- "dtype": "torch.bfloat16",
1234
- "shape": [
1235
- 5632,
1236
- 2048
1237
- ],
1238
- "offset": 0,
1239
- "length": 23068672
1240
- },
1241
- "model.layers.3.post_attention_layernorm.weight": {
1242
- "dtype": "torch.bfloat16",
1243
- "shape": [
1244
- 2048
1245
- ],
1246
- "offset": 0,
1247
- "length": 4096
1248
- },
1249
- "model.layers.3.self_attn.k_proj.weight": {
1250
- "dtype": "torch.bfloat16",
1251
- "shape": [
1252
- 256,
1253
- 2048
1254
- ],
1255
- "offset": 0,
1256
- "length": 1048576
1257
- },
1258
- "model.layers.3.self_attn.o_proj.weight": {
1259
- "dtype": "torch.bfloat16",
1260
- "shape": [
1261
- 2048,
1262
- 2048
1263
- ],
1264
- "offset": 0,
1265
- "length": 8388608
1266
- },
1267
- "model.layers.3.self_attn.q_proj.weight": {
1268
- "dtype": "torch.bfloat16",
1269
- "shape": [
1270
- 2048,
1271
- 2048
1272
- ],
1273
- "offset": 0,
1274
- "length": 8388608
1275
- },
1276
- "model.layers.3.self_attn.v_proj.weight": {
1277
- "dtype": "torch.bfloat16",
1278
- "shape": [
1279
- 256,
1280
- 2048
1281
- ],
1282
- "offset": 0,
1283
- "length": 1048576
1284
- },
1285
- "model.layers.4.input_layernorm.weight": {
1286
- "dtype": "torch.bfloat16",
1287
- "shape": [
1288
- 2048
1289
- ],
1290
- "offset": 0,
1291
- "length": 4096
1292
- },
1293
- "model.layers.4.mlp.down_proj.weight": {
1294
- "dtype": "torch.bfloat16",
1295
- "shape": [
1296
- 2048,
1297
- 5632
1298
- ],
1299
- "offset": 0,
1300
- "length": 23068672
1301
- },
1302
- "model.layers.4.mlp.gate_proj.weight": {
1303
- "dtype": "torch.bfloat16",
1304
- "shape": [
1305
- 5632,
1306
- 2048
1307
- ],
1308
- "offset": 0,
1309
- "length": 23068672
1310
- },
1311
- "model.layers.4.mlp.up_proj.weight": {
1312
- "dtype": "torch.bfloat16",
1313
- "shape": [
1314
- 5632,
1315
- 2048
1316
- ],
1317
- "offset": 0,
1318
- "length": 23068672
1319
- },
1320
- "model.layers.4.post_attention_layernorm.weight": {
1321
- "dtype": "torch.bfloat16",
1322
- "shape": [
1323
- 2048
1324
- ],
1325
- "offset": 0,
1326
- "length": 4096
1327
- },
1328
- "model.layers.4.self_attn.k_proj.weight": {
1329
- "dtype": "torch.bfloat16",
1330
- "shape": [
1331
- 256,
1332
- 2048
1333
- ],
1334
- "offset": 0,
1335
- "length": 1048576
1336
- },
1337
- "model.layers.4.self_attn.o_proj.weight": {
1338
- "dtype": "torch.bfloat16",
1339
- "shape": [
1340
- 2048,
1341
- 2048
1342
- ],
1343
- "offset": 0,
1344
- "length": 8388608
1345
- },
1346
- "model.layers.4.self_attn.q_proj.weight": {
1347
- "dtype": "torch.bfloat16",
1348
- "shape": [
1349
- 2048,
1350
- 2048
1351
- ],
1352
- "offset": 0,
1353
- "length": 8388608
1354
- },
1355
- "model.layers.4.self_attn.v_proj.weight": {
1356
- "dtype": "torch.bfloat16",
1357
- "shape": [
1358
- 256,
1359
- 2048
1360
- ],
1361
- "offset": 0,
1362
- "length": 1048576
1363
- },
1364
- "model.layers.5.input_layernorm.weight": {
1365
- "dtype": "torch.bfloat16",
1366
- "shape": [
1367
- 2048
1368
- ],
1369
- "offset": 0,
1370
- "length": 4096
1371
- },
1372
- "model.layers.5.mlp.down_proj.weight": {
1373
- "dtype": "torch.bfloat16",
1374
- "shape": [
1375
- 2048,
1376
- 5632
1377
- ],
1378
- "offset": 0,
1379
- "length": 23068672
1380
- },
1381
- "model.layers.5.mlp.gate_proj.weight": {
1382
- "dtype": "torch.bfloat16",
1383
- "shape": [
1384
- 5632,
1385
- 2048
1386
- ],
1387
- "offset": 0,
1388
- "length": 23068672
1389
- },
1390
- "model.layers.5.mlp.up_proj.weight": {
1391
- "dtype": "torch.bfloat16",
1392
- "shape": [
1393
- 5632,
1394
- 2048
1395
- ],
1396
- "offset": 0,
1397
- "length": 23068672
1398
- },
1399
- "model.layers.5.post_attention_layernorm.weight": {
1400
- "dtype": "torch.bfloat16",
1401
- "shape": [
1402
- 2048
1403
- ],
1404
- "offset": 0,
1405
- "length": 4096
1406
- },
1407
- "model.layers.5.self_attn.k_proj.weight": {
1408
- "dtype": "torch.bfloat16",
1409
- "shape": [
1410
- 256,
1411
- 2048
1412
- ],
1413
- "offset": 0,
1414
- "length": 1048576
1415
- },
1416
- "model.layers.5.self_attn.o_proj.weight": {
1417
- "dtype": "torch.bfloat16",
1418
- "shape": [
1419
- 2048,
1420
- 2048
1421
- ],
1422
- "offset": 0,
1423
- "length": 8388608
1424
- },
1425
- "model.layers.5.self_attn.q_proj.weight": {
1426
- "dtype": "torch.bfloat16",
1427
- "shape": [
1428
- 2048,
1429
- 2048
1430
- ],
1431
- "offset": 0,
1432
- "length": 8388608
1433
- },
1434
- "model.layers.5.self_attn.v_proj.weight": {
1435
- "dtype": "torch.bfloat16",
1436
- "shape": [
1437
- 256,
1438
- 2048
1439
- ],
1440
- "offset": 0,
1441
- "length": 1048576
1442
- },
1443
- "model.layers.6.input_layernorm.weight": {
1444
- "dtype": "torch.bfloat16",
1445
- "shape": [
1446
- 2048
1447
- ],
1448
- "offset": 0,
1449
- "length": 4096
1450
- },
1451
- "model.layers.6.mlp.down_proj.weight": {
1452
- "dtype": "torch.bfloat16",
1453
- "shape": [
1454
- 2048,
1455
- 5632
1456
- ],
1457
- "offset": 0,
1458
- "length": 23068672
1459
- },
1460
- "model.layers.6.mlp.gate_proj.weight": {
1461
- "dtype": "torch.bfloat16",
1462
- "shape": [
1463
- 5632,
1464
- 2048
1465
- ],
1466
- "offset": 0,
1467
- "length": 23068672
1468
- },
1469
- "model.layers.6.mlp.up_proj.weight": {
1470
- "dtype": "torch.bfloat16",
1471
- "shape": [
1472
- 5632,
1473
- 2048
1474
- ],
1475
- "offset": 0,
1476
- "length": 23068672
1477
- },
1478
- "model.layers.6.post_attention_layernorm.weight": {
1479
- "dtype": "torch.bfloat16",
1480
- "shape": [
1481
- 2048
1482
- ],
1483
- "offset": 0,
1484
- "length": 4096
1485
- },
1486
- "model.layers.6.self_attn.k_proj.weight": {
1487
- "dtype": "torch.bfloat16",
1488
- "shape": [
1489
- 256,
1490
- 2048
1491
- ],
1492
- "offset": 0,
1493
- "length": 1048576
1494
- },
1495
- "model.layers.6.self_attn.o_proj.weight": {
1496
- "dtype": "torch.bfloat16",
1497
- "shape": [
1498
- 2048,
1499
- 2048
1500
- ],
1501
- "offset": 0,
1502
- "length": 8388608
1503
- },
1504
- "model.layers.6.self_attn.q_proj.weight": {
1505
- "dtype": "torch.bfloat16",
1506
- "shape": [
1507
- 2048,
1508
- 2048
1509
- ],
1510
- "offset": 0,
1511
- "length": 8388608
1512
- },
1513
- "model.layers.6.self_attn.v_proj.weight": {
1514
- "dtype": "torch.bfloat16",
1515
- "shape": [
1516
- 256,
1517
- 2048
1518
- ],
1519
- "offset": 0,
1520
- "length": 1048576
1521
- },
1522
- "model.layers.7.input_layernorm.weight": {
1523
- "dtype": "torch.bfloat16",
1524
- "shape": [
1525
- 2048
1526
- ],
1527
- "offset": 0,
1528
- "length": 4096
1529
- },
1530
- "model.layers.7.mlp.down_proj.weight": {
1531
- "dtype": "torch.bfloat16",
1532
- "shape": [
1533
- 2048,
1534
- 5632
1535
- ],
1536
- "offset": 0,
1537
- "length": 23068672
1538
- },
1539
- "model.layers.7.mlp.gate_proj.weight": {
1540
- "dtype": "torch.bfloat16",
1541
- "shape": [
1542
- 5632,
1543
- 2048
1544
- ],
1545
- "offset": 0,
1546
- "length": 23068672
1547
- },
1548
- "model.layers.7.mlp.up_proj.weight": {
1549
- "dtype": "torch.bfloat16",
1550
- "shape": [
1551
- 5632,
1552
- 2048
1553
- ],
1554
- "offset": 0,
1555
- "length": 23068672
1556
- },
1557
- "model.layers.7.post_attention_layernorm.weight": {
1558
- "dtype": "torch.bfloat16",
1559
- "shape": [
1560
- 2048
1561
- ],
1562
- "offset": 0,
1563
- "length": 4096
1564
- },
1565
- "model.layers.7.self_attn.k_proj.weight": {
1566
- "dtype": "torch.bfloat16",
1567
- "shape": [
1568
- 256,
1569
- 2048
1570
- ],
1571
- "offset": 0,
1572
- "length": 1048576
1573
- },
1574
- "model.layers.7.self_attn.o_proj.weight": {
1575
- "dtype": "torch.bfloat16",
1576
- "shape": [
1577
- 2048,
1578
- 2048
1579
- ],
1580
- "offset": 0,
1581
- "length": 8388608
1582
- },
1583
- "model.layers.7.self_attn.q_proj.weight": {
1584
- "dtype": "torch.bfloat16",
1585
- "shape": [
1586
- 2048,
1587
- 2048
1588
- ],
1589
- "offset": 0,
1590
- "length": 8388608
1591
- },
1592
- "model.layers.7.self_attn.v_proj.weight": {
1593
- "dtype": "torch.bfloat16",
1594
- "shape": [
1595
- 256,
1596
- 2048
1597
- ],
1598
- "offset": 0,
1599
- "length": 1048576
1600
- },
1601
- "model.layers.8.input_layernorm.weight": {
1602
- "dtype": "torch.bfloat16",
1603
- "shape": [
1604
- 2048
1605
- ],
1606
- "offset": 0,
1607
- "length": 4096
1608
- },
1609
- "model.layers.8.mlp.down_proj.weight": {
1610
- "dtype": "torch.bfloat16",
1611
- "shape": [
1612
- 2048,
1613
- 5632
1614
- ],
1615
- "offset": 0,
1616
- "length": 23068672
1617
- },
1618
- "model.layers.8.mlp.gate_proj.weight": {
1619
- "dtype": "torch.bfloat16",
1620
- "shape": [
1621
- 5632,
1622
- 2048
1623
- ],
1624
- "offset": 0,
1625
- "length": 23068672
1626
- },
1627
- "model.layers.8.mlp.up_proj.weight": {
1628
- "dtype": "torch.bfloat16",
1629
- "shape": [
1630
- 5632,
1631
- 2048
1632
- ],
1633
- "offset": 0,
1634
- "length": 23068672
1635
- },
1636
- "model.layers.8.post_attention_layernorm.weight": {
1637
- "dtype": "torch.bfloat16",
1638
- "shape": [
1639
- 2048
1640
- ],
1641
- "offset": 0,
1642
- "length": 4096
1643
- },
1644
- "model.layers.8.self_attn.k_proj.weight": {
1645
- "dtype": "torch.bfloat16",
1646
- "shape": [
1647
- 256,
1648
- 2048
1649
- ],
1650
- "offset": 0,
1651
- "length": 1048576
1652
- },
1653
- "model.layers.8.self_attn.o_proj.weight": {
1654
- "dtype": "torch.bfloat16",
1655
- "shape": [
1656
- 2048,
1657
- 2048
1658
- ],
1659
- "offset": 0,
1660
- "length": 8388608
1661
- },
1662
- "model.layers.8.self_attn.q_proj.weight": {
1663
- "dtype": "torch.bfloat16",
1664
- "shape": [
1665
- 2048,
1666
- 2048
1667
- ],
1668
- "offset": 0,
1669
- "length": 8388608
1670
- },
1671
- "model.layers.8.self_attn.v_proj.weight": {
1672
- "dtype": "torch.bfloat16",
1673
- "shape": [
1674
- 256,
1675
- 2048
1676
- ],
1677
- "offset": 0,
1678
- "length": 1048576
1679
- },
1680
- "model.layers.9.input_layernorm.weight": {
1681
- "dtype": "torch.bfloat16",
1682
- "shape": [
1683
- 2048
1684
- ],
1685
- "offset": 0,
1686
- "length": 4096
1687
- },
1688
- "model.layers.9.mlp.down_proj.weight": {
1689
- "dtype": "torch.bfloat16",
1690
- "shape": [
1691
- 2048,
1692
- 5632
1693
- ],
1694
- "offset": 0,
1695
- "length": 23068672
1696
- },
1697
- "model.layers.9.mlp.gate_proj.weight": {
1698
- "dtype": "torch.bfloat16",
1699
- "shape": [
1700
- 5632,
1701
- 2048
1702
- ],
1703
- "offset": 0,
1704
- "length": 23068672
1705
- },
1706
- "model.layers.9.mlp.up_proj.weight": {
1707
- "dtype": "torch.bfloat16",
1708
- "shape": [
1709
- 5632,
1710
- 2048
1711
- ],
1712
- "offset": 0,
1713
- "length": 23068672
1714
- },
1715
- "model.layers.9.post_attention_layernorm.weight": {
1716
- "dtype": "torch.bfloat16",
1717
- "shape": [
1718
- 2048
1719
- ],
1720
- "offset": 0,
1721
- "length": 4096
1722
- },
1723
- "model.layers.9.self_attn.k_proj.weight": {
1724
- "dtype": "torch.bfloat16",
1725
- "shape": [
1726
- 256,
1727
- 2048
1728
- ],
1729
- "offset": 0,
1730
- "length": 1048576
1731
- },
1732
- "model.layers.9.self_attn.o_proj.weight": {
1733
- "dtype": "torch.bfloat16",
1734
- "shape": [
1735
- 2048,
1736
- 2048
1737
- ],
1738
- "offset": 0,
1739
- "length": 8388608
1740
- },
1741
- "model.layers.9.self_attn.q_proj.weight": {
1742
- "dtype": "torch.bfloat16",
1743
- "shape": [
1744
- 2048,
1745
- 2048
1746
- ],
1747
- "offset": 0,
1748
- "length": 8388608
1749
- },
1750
- "model.layers.9.self_attn.v_proj.weight": {
1751
- "dtype": "torch.bfloat16",
1752
- "shape": [
1753
- 256,
1754
- 2048
1755
- ],
1756
- "offset": 0,
1757
- "length": 1048576
1758
- },
1759
- "model.norm.weight": {
1760
- "dtype": "torch.bfloat16",
1761
- "shape": [
1762
- 2048
1763
- ],
1764
- "offset": 0,
1765
- "length": 4096
1766
- }
1767
  },
1768
  "weight_map": {
1769
  "lm_head.weight": "model.safetensors",
 
1
  {
2
+ "metadata": {
3
+ "total_size": 2200096768
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model.safetensors",