|
{ |
|
"metadata": { |
|
"ParamSize": 291, |
|
"ParamBytes": 39722299392.0, |
|
"BitsPerParam": 14.56926321506206 |
|
}, |
|
"records": [ |
|
{ |
|
"dataPath": "params_shard_0.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.0.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7db413de247aca08fe9236a2e9090e48" |
|
}, |
|
{ |
|
"dataPath": "params_shard_1.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.0.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "59c77c1eb45dcbec5f24042796d014fd" |
|
}, |
|
{ |
|
"dataPath": "params_shard_2.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.0.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "66271a8bfdc881d530bddce423a16473" |
|
}, |
|
{ |
|
"dataPath": "params_shard_3.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.0.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "5e6ad79422b84ab6817e84ce1eae9142" |
|
}, |
|
{ |
|
"dataPath": "params_shard_4.bin", |
|
"format": "raw-shard", |
|
"nbytes": 1137180672, |
|
"records": [ |
|
{ |
|
"name": "model.tok_embeddings.weight", |
|
"shape": [ |
|
92544, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 1137180672, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "c2c0dcdaa5fb65dc27c3af77f4be9222" |
|
}, |
|
{ |
|
"dataPath": "params_shard_5.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.1.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "6a67d00fca1fb44ec6c145f25edcf09d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_6.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.1.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0f3bce60bc68c6b0486ab25e032f1bef" |
|
}, |
|
{ |
|
"dataPath": "params_shard_7.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.1.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a56910c6a122b400b1b78632935484e4" |
|
}, |
|
{ |
|
"dataPath": "params_shard_8.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.1.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a78aaa58397280571207a00af537581c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_9.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.2.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "cbbc42abfea33905e066e923b4fa5615" |
|
}, |
|
{ |
|
"dataPath": "params_shard_10.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.2.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "3fb14b1507ee68a3cb2da640bf5f1621" |
|
}, |
|
{ |
|
"dataPath": "params_shard_11.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.2.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0c3060a8a29e05e7fee9983220c66142" |
|
}, |
|
{ |
|
"dataPath": "params_shard_12.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.2.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7565e5436c7cebbe2d0da90a2d314ee7" |
|
}, |
|
{ |
|
"dataPath": "params_shard_13.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.3.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0df3bec71638aad48c3f6fdf43250582" |
|
}, |
|
{ |
|
"dataPath": "params_shard_14.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.3.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "cded647762891145b4f2708cfb0219ce" |
|
}, |
|
{ |
|
"dataPath": "params_shard_15.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.3.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "6c0da8fb8b983d34d16a700a4b026219" |
|
}, |
|
{ |
|
"dataPath": "params_shard_16.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.10.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "3aa943f7c89f892a6ff2cc6c5dcf97bd" |
|
}, |
|
{ |
|
"dataPath": "params_shard_17.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.10.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ef650d89e9f5561640e879d433eb9291" |
|
}, |
|
{ |
|
"dataPath": "params_shard_18.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.10.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a59efb340313927ff568bb83d6189269" |
|
}, |
|
{ |
|
"dataPath": "params_shard_19.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.10.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "140bc29d20ec55db204d76c7757910d8" |
|
}, |
|
{ |
|
"dataPath": "params_shard_20.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.8.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a45245fb0d0dcfadfca2ebb59d27b11f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_21.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.8.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "6089e29b51b9445b391472dba762a4ae" |
|
}, |
|
{ |
|
"dataPath": "params_shard_22.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.9.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "67f22370f2e77097c0dd66e71dbed781" |
|
}, |
|
{ |
|
"dataPath": "params_shard_23.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.9.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "d0f49513aa0a3a998616d7fac6c31783" |
|
}, |
|
{ |
|
"dataPath": "params_shard_24.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.9.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7f875669b4b20e1a195b3d6fe124b54e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_25.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.9.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "b2abe5a96278a3aa700575d7c3974913" |
|
}, |
|
{ |
|
"dataPath": "params_shard_26.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.11.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "115da155e91aedc832328763ea5fe0db" |
|
}, |
|
{ |
|
"dataPath": "params_shard_27.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.11.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0f7ebef9ec340a3a76111f828a655fbf" |
|
}, |
|
{ |
|
"dataPath": "params_shard_28.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.11.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "2f98db679b023feef88e6e6161ca559e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_29.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.11.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "91c1e7ace4cc6d5a811ffbe9e2091b82" |
|
}, |
|
{ |
|
"dataPath": "params_shard_30.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.12.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0c127b17b7f497e819bfad9366395efd" |
|
}, |
|
{ |
|
"dataPath": "params_shard_31.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.12.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "3c8bbddb85a8a60221b60a36392dae0e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_32.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.12.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "65e865d0402bd45bf47bdc53124ca7ab" |
|
}, |
|
{ |
|
"dataPath": "params_shard_33.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.12.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f72453e64e6b45746f737ba3e873ad8f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_34.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.13.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bf8df85329a7581d062da7a3c49cea76" |
|
}, |
|
{ |
|
"dataPath": "params_shard_35.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.13.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f4607212cc716ca83ed380c0b7d8226d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_36.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.13.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "33e947cea8860a6d7ca378a3c7e8f47f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_37.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.13.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "2d2fbaa70fe5504c6893bb00bd341b15" |
|
}, |
|
{ |
|
"dataPath": "params_shard_38.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.14.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "58a7fae456e781a6349d68341fd472e7" |
|
}, |
|
{ |
|
"dataPath": "params_shard_39.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.14.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "aad5026e5d5235e5095116244220c107" |
|
}, |
|
{ |
|
"dataPath": "params_shard_40.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.14.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f2bd511d42a447d508b23d9fc00cb071" |
|
}, |
|
{ |
|
"dataPath": "params_shard_41.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.14.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "79364dac6fa081b3497ed2a0f9899321" |
|
}, |
|
{ |
|
"dataPath": "params_shard_42.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.15.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "376f15535d3f62aa3f0b6891546d6118" |
|
}, |
|
{ |
|
"dataPath": "params_shard_43.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.15.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "2c414d31013d54a7372866bff2a3e905" |
|
}, |
|
{ |
|
"dataPath": "params_shard_44.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.15.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7c41335c011514c3c6e3b6fc998f1dc7" |
|
}, |
|
{ |
|
"dataPath": "params_shard_45.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.15.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "8a450e3c401107275f5d32c1234b6aa8" |
|
}, |
|
{ |
|
"dataPath": "params_shard_46.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.16.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "deadbfc6d8875d5e6cdad4cefa3685fb" |
|
}, |
|
{ |
|
"dataPath": "params_shard_47.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.16.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "cbb9e3961a34277734f849e45866714a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_48.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.16.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f5a4ce98c5d2e52493925a19c7654adf" |
|
}, |
|
{ |
|
"dataPath": "params_shard_49.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.16.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "442cb65ef56d6751250fec205f32206d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_50.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.17.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "996c44fc4a143c6d313a6c1ab33751db" |
|
}, |
|
{ |
|
"dataPath": "params_shard_51.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.17.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "03f8715bb6374a621fcc498bddafdca1" |
|
}, |
|
{ |
|
"dataPath": "params_shard_52.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.17.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "d00a5c827c10b9efd8b963c56db13cea" |
|
}, |
|
{ |
|
"dataPath": "params_shard_53.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.17.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "1117c3033d8d3ac0b0d5a30ab12fefb6" |
|
}, |
|
{ |
|
"dataPath": "params_shard_54.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.18.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "39fb853910df32a025a6eb9ca4a25473" |
|
}, |
|
{ |
|
"dataPath": "params_shard_55.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.18.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "34904a27391a85623384e5da29c38e60" |
|
}, |
|
{ |
|
"dataPath": "params_shard_56.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.18.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "2a3eaef32fc92ccb6871327c8b875f5c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_57.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.18.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "63e9e39b6cff6bc320e6cea70ba69639" |
|
}, |
|
{ |
|
"dataPath": "params_shard_58.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.19.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a0b4ba9b944d8dbf07da9c0d087c1ba4" |
|
}, |
|
{ |
|
"dataPath": "params_shard_59.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.19.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "103771179c443ce4f4e28e7e06aebb20" |
|
}, |
|
{ |
|
"dataPath": "params_shard_60.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.19.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7e687c9999b496d0009fd5635a48f33d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_61.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.19.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "fc458af151395e439cac311eba2227bc" |
|
}, |
|
{ |
|
"dataPath": "params_shard_62.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.20.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "4b75a822656f9d5ef019b4aebbb86568" |
|
}, |
|
{ |
|
"dataPath": "params_shard_63.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.20.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "72d2fe17844cf036d734bd591202e73f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_64.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.20.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0b3cebdf40ae164954edabaed15831b0" |
|
}, |
|
{ |
|
"dataPath": "params_shard_65.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.20.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7fc53cdd069a070f875ea52d2f34a00d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_66.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.21.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "22e5b73efc709a50a55bee29ac9057df" |
|
}, |
|
{ |
|
"dataPath": "params_shard_67.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.21.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "4ce4eba3c2fe8fbebc02a092edecdd7f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_68.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.21.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "de936b13fa07faeca154116205e9d2eb" |
|
}, |
|
{ |
|
"dataPath": "params_shard_69.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.21.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7804e21972af4a0a98c4942116e28b6a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_70.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.22.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "5fce8a96d1bf435bd8dc33611ddbf449" |
|
}, |
|
{ |
|
"dataPath": "params_shard_71.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.22.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0fc9ce7067c18cf479452ef08dcecb3b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_72.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.22.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "4271a3890431078cc5ec4be13cb273f1" |
|
}, |
|
{ |
|
"dataPath": "params_shard_73.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.22.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "d03f2f509167fa77b85e331257422ba9" |
|
}, |
|
{ |
|
"dataPath": "params_shard_74.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.23.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f026f30b4b7f1fcccaf64e6aaf938462" |
|
}, |
|
{ |
|
"dataPath": "params_shard_75.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.23.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "66d19ca9fee7430684548cce174d4e13" |
|
}, |
|
{ |
|
"dataPath": "params_shard_76.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.23.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "69a9e86d60c5ba00ff45ccf02794b67b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_77.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.23.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "167de8311549bc8da52b1682e5bd7b44" |
|
}, |
|
{ |
|
"dataPath": "params_shard_78.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.24.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "779d094bb1c6cce6debfa64b638f5e61" |
|
}, |
|
{ |
|
"dataPath": "params_shard_79.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.24.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "3ea567219c3af38665ed09b6d1b16e2d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_80.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.24.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "2296ab0d0df0cc8d1a4bd3a8a5e06f4c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_81.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.24.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "aa990ed8557bc5a8e003486d56f4e187" |
|
}, |
|
{ |
|
"dataPath": "params_shard_82.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.25.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "58b0ca9f82716be7e75b4fb7455b1e0f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_83.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.25.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0c0aebabe5bacb9624c63a0c6a2a4982" |
|
}, |
|
{ |
|
"dataPath": "params_shard_84.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.25.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ae149d0cbec934811f4fd3a4d28ae2fd" |
|
}, |
|
{ |
|
"dataPath": "params_shard_85.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.25.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "35390a0c485b710883f77d26dc145867" |
|
}, |
|
{ |
|
"dataPath": "params_shard_86.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.26.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "abe647676c59ff8962a8c57567ddd83a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_87.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.26.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "234c054cc614010c6798441f9f33617b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_88.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.26.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "dbbab3c909bc282209abe32d6f29820b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_89.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.26.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "43bca02513e73101ecc185d9e9efa6b5" |
|
}, |
|
{ |
|
"dataPath": "params_shard_90.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.27.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "95e85002434e9c1d8695f865ce51ebdb" |
|
}, |
|
{ |
|
"dataPath": "params_shard_91.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.27.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ed986c68569f42b1c0d0dc3f4ed884c5" |
|
}, |
|
{ |
|
"dataPath": "params_shard_92.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.27.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "64bf6132b570a610b7247f680862f2b0" |
|
}, |
|
{ |
|
"dataPath": "params_shard_93.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.27.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "97257a4bf41f98824cd5c30a4fa53073" |
|
}, |
|
{ |
|
"dataPath": "params_shard_94.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.28.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "394ed581bc5d2e2998d06a4c3a028b33" |
|
}, |
|
{ |
|
"dataPath": "params_shard_95.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.28.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "96899c819298dbdeb12c7789383ed44d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_96.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.28.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "5bf4c2b3bf9c19b599d4d9c3bba6d73c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_97.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.28.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "c1b9e2eda5bf8720513b8c8f65bd943a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_98.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.29.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "c0a1708ab31208cdd0c6d5363d6d8093" |
|
}, |
|
{ |
|
"dataPath": "params_shard_99.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.29.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "838bd986ce2b844f216547d20c13b95e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_100.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.29.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "755c0156a106a48c4f09b4d20db1b948" |
|
}, |
|
{ |
|
"dataPath": "params_shard_101.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.29.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f425cc44a1efd94696cc7e9de4ca49c4" |
|
}, |
|
{ |
|
"dataPath": "params_shard_102.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.30.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "9386cb4e7eb3d5ee5a979bb7ac401c14" |
|
}, |
|
{ |
|
"dataPath": "params_shard_103.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.30.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "86a6705a6e9371f902e0be4c636bc4a5" |
|
}, |
|
{ |
|
"dataPath": "params_shard_104.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.30.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ddf2fad7986595d974215da056b5fbf8" |
|
}, |
|
{ |
|
"dataPath": "params_shard_105.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.30.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "df3f83c9f0b140cade318c7935ecfae6" |
|
}, |
|
{ |
|
"dataPath": "params_shard_106.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.3.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "1afed988133967734c5b986e67fa77f9" |
|
}, |
|
{ |
|
"dataPath": "params_shard_107.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.4.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "208154e4e96d7b69943d25dbaea017e0" |
|
}, |
|
{ |
|
"dataPath": "params_shard_108.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.4.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "e93ef785e28cd634b7c9fa27a2302e89" |
|
}, |
|
{ |
|
"dataPath": "params_shard_109.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.4.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "dbb3f9f1c03e11b8979f5e5c71b97161" |
|
}, |
|
{ |
|
"dataPath": "params_shard_110.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.4.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "b2047ed1a305ce22e9033c3087ea6dd1" |
|
}, |
|
{ |
|
"dataPath": "params_shard_111.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.5.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "9e4f4bbbd333758f10304c222b059adf" |
|
}, |
|
{ |
|
"dataPath": "params_shard_112.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.5.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "621902bde2f85d5f7b769d9edec80627" |
|
}, |
|
{ |
|
"dataPath": "params_shard_113.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.5.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bd0ff996707fdbd4014b85e59a9902a7" |
|
}, |
|
{ |
|
"dataPath": "params_shard_114.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.5.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "4e26cb8217bba4d5146f3e379bc16a5a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_115.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.31.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a7c7b64f3dfa86ce363887dbb9cd513e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_116.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.31.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ad296d6a68401a33255105f1357b42b5" |
|
}, |
|
{ |
|
"dataPath": "params_shard_117.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.31.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "c5f0790a4f97440bd213fb188a3af04b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_118.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.31.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bb56c06177c45c5bd2918981fa0cc481" |
|
}, |
|
{ |
|
"dataPath": "params_shard_119.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.32.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "08b57ff23c3674814561cede73380547" |
|
}, |
|
{ |
|
"dataPath": "params_shard_120.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.32.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "e58867d7ac6d2ec5c9b4ebea874cef29" |
|
}, |
|
{ |
|
"dataPath": "params_shard_121.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.32.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "df1b606f74f2f5be355a3520e19772dd" |
|
}, |
|
{ |
|
"dataPath": "params_shard_122.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.32.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f1efc78efe9c02501a66cfb689cf6a3c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_123.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.33.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "5da48a915e2929f04ec1396efecb0c11" |
|
}, |
|
{ |
|
"dataPath": "params_shard_124.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.33.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "d4d9c37a234cd8036d9ea0017d411ffe" |
|
}, |
|
{ |
|
"dataPath": "params_shard_125.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.33.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "af43da9fdb44e7935315c9cb21836bd0" |
|
}, |
|
{ |
|
"dataPath": "params_shard_126.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.33.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "c4d0cb7fb30a658097c55565769664a4" |
|
}, |
|
{ |
|
"dataPath": "params_shard_127.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.34.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f469789ef1e085ab677689b7a1676fbe" |
|
}, |
|
{ |
|
"dataPath": "params_shard_128.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.34.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "9a0a4f84967d2300b4e53f2e756729e0" |
|
}, |
|
{ |
|
"dataPath": "params_shard_129.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.34.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "10365a52603934a5d50603ff4330703a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_130.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.34.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "b8029e5306d1592191b2723a18600d45" |
|
}, |
|
{ |
|
"dataPath": "params_shard_131.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.35.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7556d983866e211fa47eb789514fb419" |
|
}, |
|
{ |
|
"dataPath": "params_shard_132.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.35.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "55d01740e75910478c7f74ec12a03d91" |
|
}, |
|
{ |
|
"dataPath": "params_shard_133.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.35.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "917a37e221e779cb91538f8688e2652e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_134.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.35.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bdd848bc9a8851a6bdd5267d82e93d1d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_135.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.36.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "669c98169ce559d5dea183321e2d1f77" |
|
}, |
|
{ |
|
"dataPath": "params_shard_136.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.36.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7872deaa142c04564b60ecf747d6c64e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_137.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.36.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f3be3dc845e43f554795f99cdfcfe056" |
|
}, |
|
{ |
|
"dataPath": "params_shard_138.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.36.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "604a687ccc4eda5384c0cdd6bfb7ce8c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_139.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.37.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "c8d84ec208254fedf2a501cf11387b5b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_140.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.37.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a65bb61f3410797558e33f35224da13a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_141.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.37.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "6797a4c7ef7f2259e464bf163d050846" |
|
}, |
|
{ |
|
"dataPath": "params_shard_142.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.37.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "536829d2be23bd13a427d6bc71209e86" |
|
}, |
|
{ |
|
"dataPath": "params_shard_143.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.38.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "0400791d56834f98233c6d49c0551cb4" |
|
}, |
|
{ |
|
"dataPath": "params_shard_144.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.38.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "b0fb70adc1ae7a7ccce055f7e14a860f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_145.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.38.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "d6edf85c6e98e21bc1c20e19711e9d0a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_146.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.38.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "cf7deb1a5452e19b9555e838e76e8d53" |
|
}, |
|
{ |
|
"dataPath": "params_shard_147.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.39.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7aa85dd5098c8da2322d847f135c82e4" |
|
}, |
|
{ |
|
"dataPath": "params_shard_148.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.39.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "2e3dadee443611c5c500e209923f40f2" |
|
}, |
|
{ |
|
"dataPath": "params_shard_149.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.39.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ae5ff02ddc94b63e22feafa08835eadf" |
|
}, |
|
{ |
|
"dataPath": "params_shard_150.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.39.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "cd40690067c1fc56e5691dc42f9573dc" |
|
}, |
|
{ |
|
"dataPath": "params_shard_151.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.40.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bca8b308788f3142f45b18eb32d79d01" |
|
}, |
|
{ |
|
"dataPath": "params_shard_152.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.40.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "557e4ad17874e2552be46fb22818ec1c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_153.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.40.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "aaea8ca7014a58e446d285a8ddfefe09" |
|
}, |
|
{ |
|
"dataPath": "params_shard_154.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.40.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ef63b0787d5a92af34ca536bb84f7164" |
|
}, |
|
{ |
|
"dataPath": "params_shard_155.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.41.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "05dcca9cd56a9636a9484df68b068351" |
|
}, |
|
{ |
|
"dataPath": "params_shard_156.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.41.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "89e72bdc3a6de41a45f81f8062bc9957" |
|
}, |
|
{ |
|
"dataPath": "params_shard_157.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.41.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "f3c856eb9e9de74f6d0cc852d3b8b921" |
|
}, |
|
{ |
|
"dataPath": "params_shard_158.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.41.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "83d2bb1e1ee58fa9e75650b7f166ece2" |
|
}, |
|
{ |
|
"dataPath": "params_shard_159.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.42.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "9a07a3bb1028bdb25065cc80d6ff5371" |
|
}, |
|
{ |
|
"dataPath": "params_shard_160.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.42.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "8274125b1c0b68ff93ef8b9d983a3033" |
|
}, |
|
{ |
|
"dataPath": "params_shard_161.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.42.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "8ee5fd9692c64c3db42bf23f398d26ce" |
|
}, |
|
{ |
|
"dataPath": "params_shard_162.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.42.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "3ecfb92f2e0dbb32a9eeca40890341ce" |
|
}, |
|
{ |
|
"dataPath": "params_shard_163.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.43.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "3aa9885182a7319e2437f23d31342ef1" |
|
}, |
|
{ |
|
"dataPath": "params_shard_164.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.43.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "fd5619a8fe09763661d26c3d561208a0" |
|
}, |
|
{ |
|
"dataPath": "params_shard_165.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.43.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "1d162302debd25d0738ebc27e3845f6d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_166.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.43.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "e4a91e37cd73d9771f0582183591e19b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_167.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.44.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bed296e48e01809cb8212c76825a665b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_168.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.44.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "08b639d0c18fcbf7c1a63fb749c5fa9b" |
|
}, |
|
{ |
|
"dataPath": "params_shard_169.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.44.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7709a967a0c53f0efc08eeb59241cd4e" |
|
}, |
|
{ |
|
"dataPath": "params_shard_170.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.44.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "143bc4d87bca35dc24a66f9c75c7e115" |
|
}, |
|
{ |
|
"dataPath": "params_shard_171.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.45.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "55ba57cff3ea364b21d309c6913dce62" |
|
}, |
|
{ |
|
"dataPath": "params_shard_172.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.45.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "b915ec4f1a2bd7b9dd4caf2280583c7c" |
|
}, |
|
{ |
|
"dataPath": "params_shard_173.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.45.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "966fb0b1ad391b49d663ef61a7097c5d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_174.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.45.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ca0ae515b744050af3357f02553ee0a2" |
|
}, |
|
{ |
|
"dataPath": "params_shard_175.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.46.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "975731a3575a366de954484c040611d2" |
|
}, |
|
{ |
|
"dataPath": "params_shard_176.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.46.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "a7a90fffbc267a8794a0d749a395466a" |
|
}, |
|
{ |
|
"dataPath": "params_shard_177.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.46.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "091009488a5c71860f1887ef965c433f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_178.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.46.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "bbba14991bf109f5a4343bde92618bcf" |
|
}, |
|
{ |
|
"dataPath": "params_shard_179.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.47.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "5af00b0e44df026910ce20f1ce1ea148" |
|
}, |
|
{ |
|
"dataPath": "params_shard_180.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.47.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ae2639212fe60abadedffff3988c2467" |
|
}, |
|
{ |
|
"dataPath": "params_shard_181.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.47.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "01f1fae460e95c1a2b4a4698d6491a7f" |
|
}, |
|
{ |
|
"dataPath": "params_shard_182.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.47.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "e35e3802e509e8248c9d0d65ffb4d84d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_183.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.6.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "000574e1f5c50c785709e320aae224be" |
|
}, |
|
{ |
|
"dataPath": "params_shard_184.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.6.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ece6470c49ccf429481fac9d62cdb081" |
|
}, |
|
{ |
|
"dataPath": "params_shard_185.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.6.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "982b234ab6c6dbb3af157be8426f6448" |
|
}, |
|
{ |
|
"dataPath": "params_shard_186.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.6.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "7dbef8765e3ff403d9f3a26e33cbece6" |
|
}, |
|
{ |
|
"dataPath": "params_shard_187.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.7.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "63a11aa5b639ae8a4b92c37f8d3206e7" |
|
}, |
|
{ |
|
"dataPath": "params_shard_188.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.7.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "5244855502245015ee7e5e293593aebd" |
|
}, |
|
{ |
|
"dataPath": "params_shard_189.bin", |
|
"format": "raw-shard", |
|
"nbytes": 402653184, |
|
"records": [ |
|
{ |
|
"name": "model.layers.7.feed_forward.gate_up_proj.weight", |
|
"shape": [ |
|
32768, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 402653184, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "e81ede3b54e31a30cf854b89a1ff3944" |
|
}, |
|
{ |
|
"dataPath": "params_shard_190.bin", |
|
"format": "raw-shard", |
|
"nbytes": 201326592, |
|
"records": [ |
|
{ |
|
"name": "model.layers.7.feed_forward.w2.weight", |
|
"shape": [ |
|
6144, |
|
16384 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 201326592, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "d44a76d8f61f376a4268aef32ed059d7" |
|
}, |
|
{ |
|
"dataPath": "params_shard_191.bin", |
|
"format": "raw-shard", |
|
"nbytes": 75497472, |
|
"records": [ |
|
{ |
|
"name": "model.layers.8.attention.wo.weight", |
|
"shape": [ |
|
6144, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 75497472, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "ef10714372f5ad230109ebaca8a4c09d" |
|
}, |
|
{ |
|
"dataPath": "params_shard_192.bin", |
|
"format": "raw-shard", |
|
"nbytes": 100663296, |
|
"records": [ |
|
{ |
|
"name": "model.layers.8.attention.wqkv.weight", |
|
"shape": [ |
|
8192, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 100663296, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "97179e5140290259938be5fe5033d0b1" |
|
}, |
|
{ |
|
"dataPath": "params_shard_193.bin", |
|
"format": "raw-shard", |
|
"nbytes": 1137180672, |
|
"records": [ |
|
{ |
|
"name": "output.weight", |
|
"shape": [ |
|
92544, |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 1137180672, |
|
"byteOffset": 0 |
|
} |
|
], |
|
"md5sum": "466cef09e5f4201900768e4ffb19c0d5" |
|
}, |
|
{ |
|
"dataPath": "params_shard_194.bin", |
|
"format": "raw-shard", |
|
"nbytes": 1191936, |
|
"records": [ |
|
{ |
|
"name": "model.layers.0.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 0 |
|
}, |
|
{ |
|
"name": "model.layers.0.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 12288 |
|
}, |
|
{ |
|
"name": "model.layers.1.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 24576 |
|
}, |
|
{ |
|
"name": "model.layers.1.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 36864 |
|
}, |
|
{ |
|
"name": "model.layers.2.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 49152 |
|
}, |
|
{ |
|
"name": "model.layers.2.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 61440 |
|
}, |
|
{ |
|
"name": "model.layers.10.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 73728 |
|
}, |
|
{ |
|
"name": "model.layers.10.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 86016 |
|
}, |
|
{ |
|
"name": "model.layers.8.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 98304 |
|
}, |
|
{ |
|
"name": "model.layers.8.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 110592 |
|
}, |
|
{ |
|
"name": "model.layers.9.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 122880 |
|
}, |
|
{ |
|
"name": "model.layers.9.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 135168 |
|
}, |
|
{ |
|
"name": "model.layers.11.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 147456 |
|
}, |
|
{ |
|
"name": "model.layers.11.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 159744 |
|
}, |
|
{ |
|
"name": "model.layers.12.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 172032 |
|
}, |
|
{ |
|
"name": "model.layers.12.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 184320 |
|
}, |
|
{ |
|
"name": "model.layers.13.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 196608 |
|
}, |
|
{ |
|
"name": "model.layers.13.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 208896 |
|
}, |
|
{ |
|
"name": "model.layers.14.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 221184 |
|
}, |
|
{ |
|
"name": "model.layers.14.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 233472 |
|
}, |
|
{ |
|
"name": "model.layers.15.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 245760 |
|
}, |
|
{ |
|
"name": "model.layers.15.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 258048 |
|
}, |
|
{ |
|
"name": "model.layers.16.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 270336 |
|
}, |
|
{ |
|
"name": "model.layers.16.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 282624 |
|
}, |
|
{ |
|
"name": "model.layers.17.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 294912 |
|
}, |
|
{ |
|
"name": "model.layers.17.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 307200 |
|
}, |
|
{ |
|
"name": "model.layers.18.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 319488 |
|
}, |
|
{ |
|
"name": "model.layers.18.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 331776 |
|
}, |
|
{ |
|
"name": "model.layers.19.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 344064 |
|
}, |
|
{ |
|
"name": "model.layers.19.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 356352 |
|
}, |
|
{ |
|
"name": "model.layers.20.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 368640 |
|
}, |
|
{ |
|
"name": "model.layers.20.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 380928 |
|
}, |
|
{ |
|
"name": "model.layers.21.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 393216 |
|
}, |
|
{ |
|
"name": "model.layers.21.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 405504 |
|
}, |
|
{ |
|
"name": "model.layers.22.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 417792 |
|
}, |
|
{ |
|
"name": "model.layers.22.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 430080 |
|
}, |
|
{ |
|
"name": "model.layers.23.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 442368 |
|
}, |
|
{ |
|
"name": "model.layers.23.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 454656 |
|
}, |
|
{ |
|
"name": "model.layers.24.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 466944 |
|
}, |
|
{ |
|
"name": "model.layers.24.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 479232 |
|
}, |
|
{ |
|
"name": "model.layers.25.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 491520 |
|
}, |
|
{ |
|
"name": "model.layers.25.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 503808 |
|
}, |
|
{ |
|
"name": "model.layers.26.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 516096 |
|
}, |
|
{ |
|
"name": "model.layers.26.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 528384 |
|
}, |
|
{ |
|
"name": "model.layers.27.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 540672 |
|
}, |
|
{ |
|
"name": "model.layers.27.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 552960 |
|
}, |
|
{ |
|
"name": "model.layers.28.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 565248 |
|
}, |
|
{ |
|
"name": "model.layers.28.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 577536 |
|
}, |
|
{ |
|
"name": "model.layers.29.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 589824 |
|
}, |
|
{ |
|
"name": "model.layers.29.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 602112 |
|
}, |
|
{ |
|
"name": "model.layers.30.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 614400 |
|
}, |
|
{ |
|
"name": "model.layers.30.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 626688 |
|
}, |
|
{ |
|
"name": "model.layers.3.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 638976 |
|
}, |
|
{ |
|
"name": "model.layers.3.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 651264 |
|
}, |
|
{ |
|
"name": "model.layers.4.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 663552 |
|
}, |
|
{ |
|
"name": "model.layers.4.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 675840 |
|
}, |
|
{ |
|
"name": "model.layers.5.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 688128 |
|
}, |
|
{ |
|
"name": "model.layers.5.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 700416 |
|
}, |
|
{ |
|
"name": "model.layers.31.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 712704 |
|
}, |
|
{ |
|
"name": "model.layers.31.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 724992 |
|
}, |
|
{ |
|
"name": "model.layers.32.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 737280 |
|
}, |
|
{ |
|
"name": "model.layers.32.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 749568 |
|
}, |
|
{ |
|
"name": "model.layers.33.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 761856 |
|
}, |
|
{ |
|
"name": "model.layers.33.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 774144 |
|
}, |
|
{ |
|
"name": "model.layers.34.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 786432 |
|
}, |
|
{ |
|
"name": "model.layers.34.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 798720 |
|
}, |
|
{ |
|
"name": "model.layers.35.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 811008 |
|
}, |
|
{ |
|
"name": "model.layers.35.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 823296 |
|
}, |
|
{ |
|
"name": "model.layers.36.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 835584 |
|
}, |
|
{ |
|
"name": "model.layers.36.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 847872 |
|
}, |
|
{ |
|
"name": "model.layers.37.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 860160 |
|
}, |
|
{ |
|
"name": "model.layers.37.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 872448 |
|
}, |
|
{ |
|
"name": "model.layers.38.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 884736 |
|
}, |
|
{ |
|
"name": "model.layers.38.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 897024 |
|
}, |
|
{ |
|
"name": "model.layers.39.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 909312 |
|
}, |
|
{ |
|
"name": "model.layers.39.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 921600 |
|
}, |
|
{ |
|
"name": "model.layers.40.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 933888 |
|
}, |
|
{ |
|
"name": "model.layers.40.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 946176 |
|
}, |
|
{ |
|
"name": "model.layers.41.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 958464 |
|
}, |
|
{ |
|
"name": "model.layers.41.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 970752 |
|
}, |
|
{ |
|
"name": "model.layers.42.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 983040 |
|
}, |
|
{ |
|
"name": "model.layers.42.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 995328 |
|
}, |
|
{ |
|
"name": "model.layers.43.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1007616 |
|
}, |
|
{ |
|
"name": "model.layers.43.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1019904 |
|
}, |
|
{ |
|
"name": "model.layers.44.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1032192 |
|
}, |
|
{ |
|
"name": "model.layers.44.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1044480 |
|
}, |
|
{ |
|
"name": "model.layers.45.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1056768 |
|
}, |
|
{ |
|
"name": "model.layers.45.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1069056 |
|
}, |
|
{ |
|
"name": "model.layers.46.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1081344 |
|
}, |
|
{ |
|
"name": "model.layers.46.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1093632 |
|
}, |
|
{ |
|
"name": "model.layers.47.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1105920 |
|
}, |
|
{ |
|
"name": "model.layers.47.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1118208 |
|
}, |
|
{ |
|
"name": "model.norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1130496 |
|
}, |
|
{ |
|
"name": "model.layers.6.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1142784 |
|
}, |
|
{ |
|
"name": "model.layers.6.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1155072 |
|
}, |
|
{ |
|
"name": "model.layers.7.attention_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1167360 |
|
}, |
|
{ |
|
"name": "model.layers.7.ffn_norm.weight", |
|
"shape": [ |
|
6144 |
|
], |
|
"dtype": "float16", |
|
"format": "f32-to-bf16", |
|
"nbytes": 12288, |
|
"byteOffset": 1179648 |
|
} |
|
], |
|
"md5sum": "80e313b0363be60fb7c8c56c2175d304" |
|
} |
|
] |
|
} |