diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d7158c68969a4e096402d60e6d8c31cfb25e012 --- /dev/null +++ b/config.json @@ -0,0 +1,23 @@ +{ + "_name_or_path": "sharpbai/vicuna-13b-v1.3", + "architectures": [ + "LlamaForCausalLM" + ], + "bos_token_id": 1, + "eos_token_id": 2, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "intermediate_size": 13824, + "max_position_embeddings": 2048, + "model_type": "llama", + "num_attention_heads": 40, + "num_hidden_layers": 40, + "pad_token_id": 0, + "rms_norm_eps": 1e-06, + "tie_word_embeddings": false, + "torch_dtype": "float16", + "transformers_version": "4.30.1", + "use_cache": false, + "vocab_size": 32000 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3076ca9866acf30d52b086b96af98a85c17015c0 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,7 @@ +{ + "_from_model_config": true, + "bos_token_id": 1, + "eos_token_id": 2, + "pad_token_id": 0, + "transformers_version": "4.30.1" +} diff --git a/pytorch_model-00001-of-00082.bin b/pytorch_model-00001-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..17abe0141bf09c2e486de1bff12116fc8d5711ba --- /dev/null +++ b/pytorch_model-00001-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdcefd7500d16d6c8e6affeff931bff282a25e2bd42ee3dddf6fd67607a11d4b +size 380110075 diff --git a/pytorch_model-00002-of-00082.bin b/pytorch_model-00002-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8532836f68e9f8cb875bc191927db488c481be96 --- /dev/null +++ b/pytorch_model-00002-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c52eca8f3910c0bc3718a61a3e017b3e513ae632d6e005815ea3163697118a +size 298846638 diff --git a/pytorch_model-00003-of-00082.bin b/pytorch_model-00003-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5516837919eb4e391ff84a6a7199878027cf316 --- /dev/null +++ b/pytorch_model-00003-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ca31b86e45e02f3099180851158ea2e97855a35fe1a776150540a75ab07ff2 +size 387996095 diff --git a/pytorch_model-00004-of-00082.bin b/pytorch_model-00004-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4630b148f8155848711fd4f1547c9d1c8c801a13 --- /dev/null +++ b/pytorch_model-00004-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1374f390196f785b2456d6ecf70a938b741d5ba2ec4daef239d9e2db1c6b78f2 +size 387975598 diff --git a/pytorch_model-00005-of-00082.bin b/pytorch_model-00005-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..62d1a6eb8b0d56d8858e67fc81008da82e209a34 --- /dev/null +++ b/pytorch_model-00005-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84df7ddab1f1b5252205186c29ea5f9f14f532fb0ab4f42d9ea5779057ce386c +size 351296801 diff --git a/pytorch_model-00006-of-00082.bin b/pytorch_model-00006-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d0e51c23c6f3d91a1910bc88909bac3806cd7a3 --- /dev/null +++ b/pytorch_model-00006-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07e35400fabcd7492c93e172f1d637cedb3f51f07a19ec79e41fdd0d8e3a493 +size 283116795 diff --git a/pytorch_model-00007-of-00082.bin b/pytorch_model-00007-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c633477d0e3d04d2dbb083b6aed1406d35cd6514 --- /dev/null +++ b/pytorch_model-00007-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9363d6f4b990a62568e1fb99d1eb830aada592e76f9a2f0cc98e9f195fa48e4 +size 351296801 diff --git a/pytorch_model-00008-of-00082.bin b/pytorch_model-00008-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..891a0f9b1a41068f6282ded41246efc451fea98d --- /dev/null +++ b/pytorch_model-00008-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d1f5596376d06ebc80945dfc1ba9336bedc4b5efc561f06de084d665393dfb +size 283116795 diff --git a/pytorch_model-00009-of-00082.bin b/pytorch_model-00009-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..460a3b9820511a31f5cd3b621368d4538cc9e8ba --- /dev/null +++ b/pytorch_model-00009-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e796292b1de691c30c1c4479bafa3821ef423e460eff97de2bb459af63b714c +size 351296801 diff --git a/pytorch_model-00010-of-00082.bin b/pytorch_model-00010-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e04de7a6ea3a96bdd1c64ab34ff0cec704520541 --- /dev/null +++ b/pytorch_model-00010-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d1d383e1c2e30be8ac251f0831725066d11c4d52aeead0ffb6a9c930886d56 +size 283116795 diff --git a/pytorch_model-00011-of-00082.bin b/pytorch_model-00011-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a89a0932877bc726039f1f725370a4a7885290d --- /dev/null +++ b/pytorch_model-00011-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02df655a58b4b410e0bf0016e41b97251108d8cb825f0c6da4cdc33fbd150858 +size 351296801 diff --git a/pytorch_model-00012-of-00082.bin b/pytorch_model-00012-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c231e6b6d53399d6bfefd9c15c7570bb3d6aa622 --- /dev/null +++ b/pytorch_model-00012-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b57be10b11d8435a8e5cee7e202e65a04e3c93c35e42515a4c24bf53b123af +size 283116795 diff --git a/pytorch_model-00013-of-00082.bin b/pytorch_model-00013-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3f8ff0e6b7b006ff83f71b85edbf5c3014d63b5 --- /dev/null +++ b/pytorch_model-00013-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08522cf1ad51131187dfe6fe58551dfe5af446c04356a598adb28ef482e2a6e +size 351296801 diff --git a/pytorch_model-00014-of-00082.bin b/pytorch_model-00014-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..95e70504e1616a77742e960669eaf1eef6359a0d --- /dev/null +++ b/pytorch_model-00014-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf596a1e659a73218f96c20698971ae90ae77d050c2bf8d2fcc89d3d007810a +size 283116795 diff --git a/pytorch_model-00015-of-00082.bin b/pytorch_model-00015-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..112e07bf441761952b2b50ae2924a90a77fbde13 --- /dev/null +++ b/pytorch_model-00015-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a655fb30e431c05e197fb6825c85052febdb1bf3180cc77ba3eaa218b544897c +size 351296801 diff --git a/pytorch_model-00016-of-00082.bin b/pytorch_model-00016-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..04f7d51a2d1bf410859560d8c44686c59abe24b7 --- /dev/null +++ b/pytorch_model-00016-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9e4dfe45b5c63dc9fba9936053af0b64d8d5caa3832fc8dfffe76dd0588682 +size 283116795 diff --git a/pytorch_model-00017-of-00082.bin b/pytorch_model-00017-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..83ba53ebdcc5774e68a973a8eab513173a18d753 --- /dev/null +++ b/pytorch_model-00017-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b5d2d9679954a805a7fdbbadcb717fda0809ece4d5ff897c7e42cb6ab3fd7e +size 351296801 diff --git a/pytorch_model-00018-of-00082.bin b/pytorch_model-00018-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1e6d6113504e101c5184dd1e98594da7c6ca8fd --- /dev/null +++ b/pytorch_model-00018-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff68087f8c5c9dc72b98eb33deffd645bd4bac8ee5510fa6d9f7281c788da36 +size 283116795 diff --git a/pytorch_model-00019-of-00082.bin b/pytorch_model-00019-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..58aaa67eef704585251b6266b07322c45a994bd5 --- /dev/null +++ b/pytorch_model-00019-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2c94ee8c38f655ebcb1f9175e7741b71664da84400a34ed841eb96f02d60d6 +size 351296801 diff --git a/pytorch_model-00020-of-00082.bin b/pytorch_model-00020-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..675a677da46e4be17ffbf455e5aec773874702d4 --- /dev/null +++ b/pytorch_model-00020-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc62bbfb6277aa6ed79a5cc1702a099902f5a932dfebea20a194a503eb767a75 +size 283116795 diff --git a/pytorch_model-00021-of-00082.bin b/pytorch_model-00021-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b04405cc824ceef2c512ca91c78d94f6897dda64 --- /dev/null +++ b/pytorch_model-00021-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b136094e310eb7842796b6a16dff73e19dfb502e92212178a97bd2ae1964e01 +size 351296865 diff --git a/pytorch_model-00022-of-00082.bin b/pytorch_model-00022-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..50957e59ec873e9c90176ce74fbc4476cc2ff693 --- /dev/null +++ b/pytorch_model-00022-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba1bddcfe45574dee0572db54fbbf727326e17f21c760a8d738d9469c9c02d7 +size 283116795 diff --git a/pytorch_model-00023-of-00082.bin b/pytorch_model-00023-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bb64b6456ead23105b7899e712010758abf4652 --- /dev/null +++ b/pytorch_model-00023-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d369076497348c6c279532c90ed2a4dd907e06a2c58d0a1ae22e6e44551b3784 +size 351296865 diff --git a/pytorch_model-00024-of-00082.bin b/pytorch_model-00024-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..83c432ff8c98c923ac26ce1c36e0af6c63e5866f --- /dev/null +++ b/pytorch_model-00024-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:838996414b4c2c14e6ce5c938493af0bd9e59e47d6234a9a74768c3d19251928 +size 283116795 diff --git a/pytorch_model-00025-of-00082.bin b/pytorch_model-00025-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5348ec3ec4bfd39072c56d24191e9033ad79b9b9 --- /dev/null +++ b/pytorch_model-00025-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da9122eb8067b1b7d679ce0126dbde4ef2339ceeeaf586d9986295b459892bb +size 351296865 diff --git a/pytorch_model-00026-of-00082.bin b/pytorch_model-00026-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d52e547e0e68329e93f41eeb0e9a3bfb7565f528 --- /dev/null +++ b/pytorch_model-00026-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c436db99143d9cd5a75a2b35fcdf89874a886bfef46da614ec28ff733c426e41 +size 283116795 diff --git a/pytorch_model-00027-of-00082.bin b/pytorch_model-00027-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d04c1cd499df78e19f348800339743c7fedeba03 --- /dev/null +++ b/pytorch_model-00027-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95316b4523347577a57d913162586d864d1148cdb0be01287104acfbae1b3e47 +size 351296865 diff --git a/pytorch_model-00028-of-00082.bin b/pytorch_model-00028-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..9353f0c2edea09de7b0744e0f13cc4b366973ee6 --- /dev/null +++ b/pytorch_model-00028-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4fed2868780d0f5f944b4671587a74fd85887e5b7e333610b8e0901493d3cf2 +size 283116795 diff --git a/pytorch_model-00029-of-00082.bin b/pytorch_model-00029-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2071ed0f5e781c409718753285bf7630a466f21 --- /dev/null +++ b/pytorch_model-00029-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:791ebce20764e1fa0197950673765f9012d63f0f44bfd025e9cf9cf076dd09bd +size 351296865 diff --git a/pytorch_model-00030-of-00082.bin b/pytorch_model-00030-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac9be700fb885e9ce7242264e1f55a727b7f0d28 --- /dev/null +++ b/pytorch_model-00030-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94bf43baa4f395d879afc2cffbaaa26f22e4a0a9cc1349f2c47ddb80bb334677 +size 283116795 diff --git a/pytorch_model-00031-of-00082.bin b/pytorch_model-00031-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..57560e773de0979fad1ddf7f94d305ed71127225 --- /dev/null +++ b/pytorch_model-00031-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b132e27dd4a112e2daf8dae2589e85079862d031437c4445fcefd103e46edaea +size 351296865 diff --git a/pytorch_model-00032-of-00082.bin b/pytorch_model-00032-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ce9641826319a93afca2397c5b4d5b5923046676 --- /dev/null +++ b/pytorch_model-00032-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7de09b5c222e43bd9adf5dc2f9e713094f18bb473d63c18a850f62940c0dad +size 283116795 diff --git a/pytorch_model-00033-of-00082.bin b/pytorch_model-00033-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1070c0cc420aa2045b3fcf80167b01588bdd93f --- /dev/null +++ b/pytorch_model-00033-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c3dea208b58898d6df8f482bea5d6d04a8a6d938353164df585ae541bdfcb4 +size 351296865 diff --git a/pytorch_model-00034-of-00082.bin b/pytorch_model-00034-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d930d4bab057e74ecb323ab4e2b470f2a54f4dda --- /dev/null +++ b/pytorch_model-00034-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc53ffb1bf2255077da368e7ee66b8fca50a458e8f1456c6478332323284156 +size 283116795 diff --git a/pytorch_model-00035-of-00082.bin b/pytorch_model-00035-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..36dd580462d7e37f3454eb6c1df0c0d4f5842411 --- /dev/null +++ b/pytorch_model-00035-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218ae9a49b73a32716950e468f1eb7079b2995729820085dded062eb750bd016 +size 351296865 diff --git a/pytorch_model-00036-of-00082.bin b/pytorch_model-00036-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..12c9ae04e699c3301df12bedf07c2c412f34389f --- /dev/null +++ b/pytorch_model-00036-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:787bb254d3940248b719ab80b59b16139023c8d55e9576d1eb88cf3099138c69 +size 283116795 diff --git a/pytorch_model-00037-of-00082.bin b/pytorch_model-00037-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2f2a8acc8d1c64b91a015b9e0d1a5222c614484 --- /dev/null +++ b/pytorch_model-00037-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75140bc3778cc9ec170d2920a1727440668b16519ca0429c6f44cc9005d34b6 +size 351296865 diff --git a/pytorch_model-00038-of-00082.bin b/pytorch_model-00038-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3af1cc377a6e33098aeee1816c5849cc1bb5830e --- /dev/null +++ b/pytorch_model-00038-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09acd14f600b7f030a3bc0f22fa8a3d5f0a45d178a8ad54c2879ee90c50d14a2 +size 283116795 diff --git a/pytorch_model-00039-of-00082.bin b/pytorch_model-00039-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..79fdd89b2eadeb11356400c5425e38e52d17be0b --- /dev/null +++ b/pytorch_model-00039-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd10a40e9b9875f69355192fce42b0448dffb644f8aa466e6fdb755dce821f8 +size 351296865 diff --git a/pytorch_model-00040-of-00082.bin b/pytorch_model-00040-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..19fc1bc49c049fc7efc153c6a6ec893900cb1da0 --- /dev/null +++ b/pytorch_model-00040-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:847eacea67bbdedaa70ef0716f77c506052d3101d659ba4f635f26a72a1aad93 +size 283116795 diff --git a/pytorch_model-00041-of-00082.bin b/pytorch_model-00041-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7a1adb9f2e8ccd29c9c91cb8bf5a4e63829903e --- /dev/null +++ b/pytorch_model-00041-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2d5289cb414c5efa9b3f394415437b8d2653a318f36eec8653248bfd5f1e05 +size 351296865 diff --git a/pytorch_model-00042-of-00082.bin b/pytorch_model-00042-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0c2108b23ae619c7779d8faeaebbab81f94aed7 --- /dev/null +++ b/pytorch_model-00042-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ee77d8b11534455d4e3a6916f3fda6990593cecffedc9b8e7939139f8c2bcc2 +size 283116795 diff --git a/pytorch_model-00043-of-00082.bin b/pytorch_model-00043-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d82a0fe9a4c993c956ac4f00561376d7dea5b5f9 --- /dev/null +++ b/pytorch_model-00043-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2952419fc7561bf5e8e820ed0a97e6354a5e661778f500e4d10324a4a73abf2 +size 351296865 diff --git a/pytorch_model-00044-of-00082.bin b/pytorch_model-00044-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3e461d599fb8ea64808be84efcafe0e4beab9913 --- /dev/null +++ b/pytorch_model-00044-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba555138025fd8d9c44cfa6b730b5c939135337986dd7b95ec81cf508ce90703 +size 283116795 diff --git a/pytorch_model-00045-of-00082.bin b/pytorch_model-00045-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f8c34b2142f6d2e14b4f2fbfb1214068f8f637d --- /dev/null +++ b/pytorch_model-00045-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408b3b29f5ba0fe9c58290fb5f7116f93b0bc8b76226751d5af7852fcc41faed +size 351296865 diff --git a/pytorch_model-00046-of-00082.bin b/pytorch_model-00046-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5351c7e979f10259f68a58990df402871ac5b580 --- /dev/null +++ b/pytorch_model-00046-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c79d79a702c43bfa58f5dc649d0ae80597f0c1fcfe53b1326ac04a9e667f34 +size 283116795 diff --git a/pytorch_model-00047-of-00082.bin b/pytorch_model-00047-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c654eb94a97eaa072c6e85b3f2b8b2fc8d9d3aa5 --- /dev/null +++ b/pytorch_model-00047-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9cd56036fcd866d8b5827b08862c4cdc92d33c3d99105edb378ec3f88ca3a9a +size 351296865 diff --git a/pytorch_model-00048-of-00082.bin b/pytorch_model-00048-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..157ee110a150cf7319c8a41044d6ebd7ad7d2a0e --- /dev/null +++ b/pytorch_model-00048-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd659768e948c6b202bd9f813776c15618eb5a31280ce1486b077da436a1e798 +size 283116795 diff --git a/pytorch_model-00049-of-00082.bin b/pytorch_model-00049-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c127a2fd41b7a14632fe874b68966851310532c7 --- /dev/null +++ b/pytorch_model-00049-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221e04a59e8db07aef9c11443320427cf6822b224aaad392d066ef7adb4be951 +size 351296865 diff --git a/pytorch_model-00050-of-00082.bin b/pytorch_model-00050-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7f02f8897cd3afcbcae7ad2e46f7f18238e047f --- /dev/null +++ b/pytorch_model-00050-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae57f4e0a67326769a9772b52ccd350a54bb68e3c367e84a9e1c9a23aef2b05 +size 283116795 diff --git a/pytorch_model-00051-of-00082.bin b/pytorch_model-00051-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4df74601ae4686663d19a5eed96baf9ae6a3ea1f --- /dev/null +++ b/pytorch_model-00051-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45ce6714b95fb60b2a0093d8a92727e712d44240994c425e9b83d923a7329d29 +size 351296865 diff --git a/pytorch_model-00052-of-00082.bin b/pytorch_model-00052-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b03d6ddad9775ba3d21c3ec2da61488e2d1df058 --- /dev/null +++ b/pytorch_model-00052-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37ddced9c4a553d4532347c0f7249cdcbb253847cd96a4f7f1d588f59631b91 +size 283116795 diff --git a/pytorch_model-00053-of-00082.bin b/pytorch_model-00053-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c96b2d18ec5c37f7f7ff2da4fdf43eaff8a346eb --- /dev/null +++ b/pytorch_model-00053-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2800baf2bef7fec21959a748909b129a480c8c1606d8208fdf1ce224efd5d782 +size 351296865 diff --git a/pytorch_model-00054-of-00082.bin b/pytorch_model-00054-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..381603dbd3c9923c437f23827bb1beb20f98dadf --- /dev/null +++ b/pytorch_model-00054-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3f5b39f4ea47d0a3d416522195bcbdf027a57a46e3dfa14eaea97a53fd0133 +size 283116795 diff --git a/pytorch_model-00055-of-00082.bin b/pytorch_model-00055-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1527491d466ee3fe4c2e9ab9363a49fc77c3881 --- /dev/null +++ b/pytorch_model-00055-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3273484d9b051aac2e0c6c1ebde80e3db8e68ee1e21a617599471d7522e852f1 +size 351296865 diff --git a/pytorch_model-00056-of-00082.bin b/pytorch_model-00056-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..17387ce75d1be4208dc9af9b0c20c59551f31d07 --- /dev/null +++ b/pytorch_model-00056-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86f7545bc30f47eaf92fa8dbac625f64aa40ef6257ef2c8cc535dedc00965c42 +size 283116795 diff --git a/pytorch_model-00057-of-00082.bin b/pytorch_model-00057-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea92928a33de9e2c1937ac93703bff947aa6efb5 --- /dev/null +++ b/pytorch_model-00057-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b846be3018a28e00a67e48e0a4602a493dd221ae5c17802ed9d2669df7a0b1 +size 351296865 diff --git a/pytorch_model-00058-of-00082.bin b/pytorch_model-00058-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6581a794cb4d2566e4f1c5f32f0c2ddc1377b38 --- /dev/null +++ b/pytorch_model-00058-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253abe7bec9a7a61b1b06da21d9f03f33f9046961942a19479f6e0eab74d1974 +size 283116795 diff --git a/pytorch_model-00059-of-00082.bin b/pytorch_model-00059-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7cffe201c584088321122fb696845b8ae878e25 --- /dev/null +++ b/pytorch_model-00059-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b314947bf48302f03ba2f5386a3a17e591ab2d2e9dbe131d39e4cd0dde24582b +size 351296865 diff --git a/pytorch_model-00060-of-00082.bin b/pytorch_model-00060-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1087990551c6af3cd22466ac38453fd7db3caf1b --- /dev/null +++ b/pytorch_model-00060-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36663d45fa24b90a1c382479053dc10551ce3a9d2a3ee44f5c55352d93e8fd4e +size 283116795 diff --git a/pytorch_model-00061-of-00082.bin b/pytorch_model-00061-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c495da7e127834e467f845d5bbd934733d1efeb --- /dev/null +++ b/pytorch_model-00061-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd11bdc66b933671f67953e2c6875eca3cf43f229fb2342f3cbfd02cbbb6f8fe +size 351296865 diff --git a/pytorch_model-00062-of-00082.bin b/pytorch_model-00062-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc37064333345dab5c20df3a4997ddac31b76368 --- /dev/null +++ b/pytorch_model-00062-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac13d11001db29da0db05c243d288b9b77236a583e92d007512417537e45285 +size 283116795 diff --git a/pytorch_model-00063-of-00082.bin b/pytorch_model-00063-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f423e55de9405645d3733c654eee9b6d52bf4bc8 --- /dev/null +++ b/pytorch_model-00063-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6f5ac5cb2de4f160f747c678c3ca1b4aabc0618a211ee2c2471e87045e5e8a +size 351296865 diff --git a/pytorch_model-00064-of-00082.bin b/pytorch_model-00064-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..41550bb55ef181658fd14a33711b1b761035c583 --- /dev/null +++ b/pytorch_model-00064-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ee9cc812b9c4d19d61224464347b47008e05bb6efd78aadd8c97f6e3787724 +size 283116795 diff --git a/pytorch_model-00065-of-00082.bin b/pytorch_model-00065-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ea1a8c28a88741775b1d6a606b3b48f8c6a9717 --- /dev/null +++ b/pytorch_model-00065-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418c4b9d44adc9acb323f7d702d9c1117eb47144bfcc91c4856a580ebefb4110 +size 351296865 diff --git a/pytorch_model-00066-of-00082.bin b/pytorch_model-00066-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b1a0141acf441c70f368ad5c1de78ddb27c12ed --- /dev/null +++ b/pytorch_model-00066-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265cd7f05fb11f5c47b83bcfdb5b9d2cb2d45dd44a77e55aebeec5d111bde636 +size 283116795 diff --git a/pytorch_model-00067-of-00082.bin b/pytorch_model-00067-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc92bad4c4fcf2e813bb29b955158714e1bc168b --- /dev/null +++ b/pytorch_model-00067-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd14c49dcb1899e91664cb7bce9525c6348809236fc2796d7c7f30060036362 +size 351296865 diff --git a/pytorch_model-00068-of-00082.bin b/pytorch_model-00068-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..46dd3fac6763bcf51318063cae4177e6dd276321 --- /dev/null +++ b/pytorch_model-00068-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ca2027e73a8bf0b285f762b9880feb075c5554eff5122d2bc180e8b01f3dc2 +size 283116795 diff --git a/pytorch_model-00069-of-00082.bin b/pytorch_model-00069-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..806ea735c7dfcdac198cc0d5550c382b3f8f1923 --- /dev/null +++ b/pytorch_model-00069-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f3f1b20c464fd78a93a24beacde8e6aa6c974362ab0298dca6575cd85318df +size 351296865 diff --git a/pytorch_model-00070-of-00082.bin b/pytorch_model-00070-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d53054b88b1b1c209b8039f2e5e11a7c7deeeb64 --- /dev/null +++ b/pytorch_model-00070-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39f4fb843091652c0755ee1e21881f6722366231895542b5f3ef0507c1eb53e +size 283116795 diff --git a/pytorch_model-00071-of-00082.bin b/pytorch_model-00071-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..962e8a61c3a89a076c779111f9f55f8eb541868d --- /dev/null +++ b/pytorch_model-00071-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:530ea21eb213e8ed4908cf496a56987e01c7c93a4063283ab05bd600900bbd56 +size 351296865 diff --git a/pytorch_model-00072-of-00082.bin b/pytorch_model-00072-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..bfbe38766b0acded7b666056e0cac2b222a394aa --- /dev/null +++ b/pytorch_model-00072-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ea1d4db4ad62796323295338bd2cf257838a0d248a0d6afff5a1dd3afb4963 +size 283116795 diff --git a/pytorch_model-00073-of-00082.bin b/pytorch_model-00073-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ca3814a4ae94dd32901752a3654799a2050720c --- /dev/null +++ b/pytorch_model-00073-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2114aadcb7844051bda6a0dee5bc031016dfb8e0c6d0ccbc24c048b467f6510 +size 351296865 diff --git a/pytorch_model-00074-of-00082.bin b/pytorch_model-00074-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f876fd5007b7026b86d1ca861d864c1245b42d8 --- /dev/null +++ b/pytorch_model-00074-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd9fab788709e102c547ccb9370db7aa198f9af3b08e1bedf73d235126caa9b +size 283116795 diff --git a/pytorch_model-00075-of-00082.bin b/pytorch_model-00075-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f05cb914550e4eb263972bdb753b228c00666d1f --- /dev/null +++ b/pytorch_model-00075-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd7eb9cd1a7ce8f529a30c9524b374dcb8713cb6242e624ef9708d3ec0243e3 +size 351296865 diff --git a/pytorch_model-00076-of-00082.bin b/pytorch_model-00076-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..15181f1242e7dc09ec6a065f6208433a50c11660 --- /dev/null +++ b/pytorch_model-00076-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d09ed9040d7e25236ce323d69b3659be61f926835915b959f30a8fe9b35841 +size 283116795 diff --git a/pytorch_model-00077-of-00082.bin b/pytorch_model-00077-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..23dff3df5237bf3f012f2e74df6f11fe7fd3d5a4 --- /dev/null +++ b/pytorch_model-00077-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e8912b8f19a4f0379a94ce7459319faf416f4c76048ed5df6b92da5801180f +size 351296865 diff --git a/pytorch_model-00078-of-00082.bin b/pytorch_model-00078-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..29320bc449a6e27cbf5115d12677b2c0dddf62d2 --- /dev/null +++ b/pytorch_model-00078-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0126e43e4447e4d638addaa78c33ebcd5ab6712c82cf9193a28424f297ff245 +size 283116795 diff --git a/pytorch_model-00079-of-00082.bin b/pytorch_model-00079-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1099b496f67f7f6d10b1ac300d3794187a24035c --- /dev/null +++ b/pytorch_model-00079-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826e3521d96c7ee3eeef25078aeb7263d3b424d65eaf7d5dbc7d5a04222a0c6d +size 351296865 diff --git a/pytorch_model-00080-of-00082.bin b/pytorch_model-00080-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3229752b7c463037ef54baee8bc4416c2747f48e --- /dev/null +++ b/pytorch_model-00080-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e372c51fd95267d3292c28c2147a1eba112e05212b2dd4fb1fdbec2becdfc58a +size 283116795 diff --git a/pytorch_model-00081-of-00082.bin b/pytorch_model-00081-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd6d58769f845b1fec3cd87b0f1b92cdc59ee5f3 --- /dev/null +++ b/pytorch_model-00081-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5f6bb2951dec89dd99220d22ec04a73e93d1a85ce5852bff76e5d15cc71c5f +size 141590301 diff --git a/pytorch_model-00082-of-00082.bin b/pytorch_model-00082-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3630e76a8f1562c79387eef55b0ef9eda547b9a --- /dev/null +++ b/pytorch_model-00082-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d126afe074784330a7a820117a8449d18c333efb555bd995bd0cdab67381b4 +size 327680938 diff --git a/pytorch_model.bin.index.json b/pytorch_model.bin.index.json new file mode 100644 index 0000000000000000000000000000000000000000..e684cedb1a653453ef5bec1df2994064d057ee48 --- /dev/null +++ b/pytorch_model.bin.index.json @@ -0,0 +1,410 @@ +{ + "metadata": { + "total_size": 26031738880 + }, + "weight_map": { + "lm_head.weight": "pytorch_model-00082-of-00082.bin", + "model.embed_tokens.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.input_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.down_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.gate_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.mlp.up_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.post_attention_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.self_attn.k_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.o_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.q_proj.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.self_attn.rotary_emb.inv_freq": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.v_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.1.input_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.mlp.down_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.gate_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.up_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.post_attention_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.self_attn.k_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.o_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.q_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.rotary_emb.inv_freq": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.v_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.10.input_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.mlp.down_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.gate_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.up_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.post_attention_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.self_attn.k_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.o_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.q_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.rotary_emb.inv_freq": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.v_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.11.input_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.mlp.down_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.gate_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.up_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.post_attention_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.self_attn.k_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.o_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.q_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.rotary_emb.inv_freq": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.v_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.12.input_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.mlp.down_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.gate_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.up_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.post_attention_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.self_attn.k_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.o_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.q_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.rotary_emb.inv_freq": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.v_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.13.input_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.mlp.down_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.gate_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.up_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.post_attention_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.self_attn.k_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.o_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.q_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.rotary_emb.inv_freq": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.v_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.14.input_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.mlp.down_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.gate_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.up_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.post_attention_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.self_attn.k_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.o_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.q_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.rotary_emb.inv_freq": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.v_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.15.input_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.mlp.down_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.gate_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.up_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.post_attention_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.self_attn.k_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.o_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.q_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.rotary_emb.inv_freq": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.v_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.16.input_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.mlp.down_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.gate_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.up_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.post_attention_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.self_attn.k_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.o_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.q_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.rotary_emb.inv_freq": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.v_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.17.input_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.mlp.down_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.gate_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.up_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.post_attention_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.self_attn.k_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.o_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.q_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.rotary_emb.inv_freq": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.v_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.18.input_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.mlp.down_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.gate_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.up_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.post_attention_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.self_attn.k_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.o_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.q_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.rotary_emb.inv_freq": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.v_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.19.input_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.mlp.down_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.gate_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.up_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.post_attention_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.self_attn.k_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.o_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.q_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.rotary_emb.inv_freq": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.v_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.2.input_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.mlp.down_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.gate_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.up_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.post_attention_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.self_attn.k_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.o_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.q_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.rotary_emb.inv_freq": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.v_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.20.input_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.mlp.down_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.gate_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.up_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.post_attention_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.self_attn.k_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.o_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.q_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.rotary_emb.inv_freq": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.v_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.21.input_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.mlp.down_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.gate_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.up_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.post_attention_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.self_attn.k_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.o_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.q_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.rotary_emb.inv_freq": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.v_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.22.input_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.mlp.down_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.gate_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.up_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.post_attention_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.self_attn.k_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.rotary_emb.inv_freq": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.23.input_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.mlp.down_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.up_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.rotary_emb.inv_freq": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.v_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.24.input_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.mlp.down_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.gate_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.up_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.post_attention_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.self_attn.k_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.o_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.q_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.rotary_emb.inv_freq": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.v_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.25.input_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.mlp.down_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.gate_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.up_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.post_attention_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.self_attn.k_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.o_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.q_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.rotary_emb.inv_freq": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.v_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.26.input_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.mlp.down_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.gate_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.up_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.post_attention_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.self_attn.k_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.o_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.q_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.rotary_emb.inv_freq": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.v_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.27.input_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.mlp.down_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.gate_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.up_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.post_attention_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.self_attn.k_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.o_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.q_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.rotary_emb.inv_freq": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.v_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.28.input_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.mlp.down_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.gate_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.up_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.post_attention_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.self_attn.k_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.o_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.q_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.rotary_emb.inv_freq": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.v_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.29.input_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.mlp.down_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.gate_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.up_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.post_attention_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.self_attn.k_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.o_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.q_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.rotary_emb.inv_freq": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.v_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.3.input_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.mlp.down_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.gate_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.up_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.post_attention_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.self_attn.k_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.o_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.q_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.rotary_emb.inv_freq": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.v_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.30.input_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.mlp.down_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.gate_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.up_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.post_attention_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.self_attn.k_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.o_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.q_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.rotary_emb.inv_freq": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.v_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.31.input_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.mlp.down_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.gate_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.up_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.post_attention_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.self_attn.k_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.o_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.q_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.rotary_emb.inv_freq": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.v_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.32.input_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.mlp.down_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.gate_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.up_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.post_attention_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.self_attn.k_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.o_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.q_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.rotary_emb.inv_freq": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.v_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.33.input_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.mlp.down_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.gate_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.up_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.post_attention_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.self_attn.k_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.o_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.q_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.rotary_emb.inv_freq": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.v_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.34.input_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.mlp.down_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.gate_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.up_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.post_attention_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.self_attn.k_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.o_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.q_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.rotary_emb.inv_freq": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.v_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.35.input_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.mlp.down_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.gate_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.up_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.post_attention_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.self_attn.k_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.o_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.q_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.rotary_emb.inv_freq": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.v_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.36.input_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.mlp.down_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.gate_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.up_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.post_attention_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.self_attn.k_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.o_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.q_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.rotary_emb.inv_freq": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.v_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.37.input_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.mlp.down_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.gate_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.up_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.post_attention_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.self_attn.k_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.o_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.q_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.rotary_emb.inv_freq": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.v_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.38.input_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.mlp.down_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.gate_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.up_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.post_attention_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.self_attn.k_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.o_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.q_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.rotary_emb.inv_freq": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.v_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.39.input_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.mlp.down_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.gate_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.up_proj.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.post_attention_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.self_attn.k_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.o_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.q_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.rotary_emb.inv_freq": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.v_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.4.input_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.mlp.down_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.gate_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.up_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.post_attention_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.self_attn.k_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.o_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.q_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.rotary_emb.inv_freq": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.v_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.5.input_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.mlp.down_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.gate_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.up_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.post_attention_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.self_attn.k_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.o_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.q_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.rotary_emb.inv_freq": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.v_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.6.input_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.mlp.down_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.gate_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.up_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.post_attention_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.self_attn.k_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.o_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.q_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.rotary_emb.inv_freq": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.v_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.7.input_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.mlp.down_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.gate_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.up_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.post_attention_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.self_attn.k_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.o_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.q_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.rotary_emb.inv_freq": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.v_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.8.input_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.mlp.down_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.gate_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.up_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.post_attention_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.self_attn.k_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.o_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.q_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.rotary_emb.inv_freq": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.v_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.9.input_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.mlp.down_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.gate_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.up_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.post_attention_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.self_attn.k_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.o_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.q_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.rotary_emb.inv_freq": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.v_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.norm.weight": "pytorch_model-00081-of-00082.bin" + } +}