diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..46c87c6c2d60780d6b0662fc2c2585983c8840a1
--- /dev/null
+++ b/config.json
@@ -0,0 +1,38 @@
+{
+ "_name_or_path": "Nemotron-4-340B-Instruct-hf",
+ "architectures": [
+ "NemotronForCausalLM"
+ ],
+ "attention_bias": false,
+ "attention_dropout": 0.0,
+ "bos_token_id": 2,
+ "eos_token_id": 3,
+ "head_dim": 192,
+ "hidden_act": "relu2",
+ "hidden_size": 18432,
+ "initializer_range": 0.0063,
+ "intermediate_size": 73728,
+ "max_position_embeddings": 4096,
+ "mlp_bias": false,
+ "model_type": "nemotron",
+ "norm_eps": 1e-05,
+ "num_attention_heads": 96,
+ "num_hidden_layers": 96,
+ "num_key_value_heads": 8,
+ "quantization_config": {
+ "activation_scheme": "dynamic",
+ "ignored_layers": [
+ "lm_head"
+ ],
+ "quant_method": "fp8"
+ },
+ "rope_percent": 0.5,
+ "rope_percentage": 0.5,
+ "rope_scaling": null,
+ "rope_theta": 10000,
+ "tie_word_embeddings": false,
+ "torch_dtype": "bfloat16",
+ "transformers_version": "4.43.0.dev0",
+ "use_cache": true,
+ "vocab_size": 256000
+}
diff --git a/generation_config.json b/generation_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..48aaabbb180a6c12eec92ff6a9dc11edb619bbe1
--- /dev/null
+++ b/generation_config.json
@@ -0,0 +1,6 @@
+{
+ "_from_model_config": true,
+ "bos_token_id": 2,
+ "eos_token_id": 3,
+ "transformers_version": "4.43.0.dev0"
+}
diff --git a/model-00001-of-00189.safetensors b/model-00001-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6c330a664bf99961d167b00cf22d27063f8fc3ab
--- /dev/null
+++ b/model-00001-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3acc010dae170bb2e747754807e46f8210bbcb8020b6d4f7c60d953ea147c0d5
+size 9437184112
diff --git a/model-00002-of-00189.safetensors b/model-00002-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5fa749216bc3c13e3e71a94fc796a9e8e8252d9c
--- /dev/null
+++ b/model-00002-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1241cb0e1c6bef6670a378c7c969b051aed5cff6d09ae884ee97e98a14a383f9
+size 2095055948
diff --git a/model-00003-of-00189.safetensors b/model-00003-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d498550151c1e87ef3546b329ec5dcad2896ce33
--- /dev/null
+++ b/model-00003-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e2b4bc51db835ef4dec7496bcb396b1edc6b10f34edc27d88fa69c691a52052
+size 2095203836
diff --git a/model-00004-of-00189.safetensors b/model-00004-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6c0632e273bcadb29e3b78cd23e8462e0bf9479d
--- /dev/null
+++ b/model-00004-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81d1c3f14142563bb4a866b916aec8bcdfaf9124daf4a39ae01e87c57b64eda1
+size 1358954708
diff --git a/model-00005-of-00189.safetensors b/model-00005-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5a6899ad862aec9907688c12fec8c0c5f3b80d1e
--- /dev/null
+++ b/model-00005-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:705f8828b4f753269814308145de39324aaf019e4e964d3252b14a53f57d81f2
+size 2095203836
diff --git a/model-00006-of-00189.safetensors b/model-00006-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c7672316df5cab2a0e320415ea45c71c5198c3fb
--- /dev/null
+++ b/model-00006-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30bff5938b807eea5d757ba42bcae23bdd851309fa0a63c28798cfc4795ec59c
+size 1358954708
diff --git a/model-00007-of-00189.safetensors b/model-00007-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..613721c55e06cd038730dbce61753feaea63eae6
--- /dev/null
+++ b/model-00007-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ba4d876816ab715e82b3cbd590bca26607cc80435be87aa1b34e8b4879a8c71a
+size 2095203836
diff --git a/model-00008-of-00189.safetensors b/model-00008-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..938fbd9716f34e890aa1c27a3769a7db33e8d697
--- /dev/null
+++ b/model-00008-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:956379d7ebf47042d0515343dd07abc961761974a26b293155c1353ad4dc79f3
+size 1358954708
diff --git a/model-00009-of-00189.safetensors b/model-00009-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a08c7d9fa2a2b0ae5a664f8fc75c56cffb015f5b
--- /dev/null
+++ b/model-00009-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:35a904ddb2bd0608faf308ae114d19ba866d2ee230ddfbf7361a6ab32a21f155
+size 2095203836
diff --git a/model-00010-of-00189.safetensors b/model-00010-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b0c2613a882ec3ad0055c675c5c791ea112fef9d
--- /dev/null
+++ b/model-00010-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3fd71156f376b05d311369b0448d8ac92374256a3f58f96e39297e5e6cd5a66d
+size 1358954708
diff --git a/model-00011-of-00189.safetensors b/model-00011-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c9012ae53e0643517f55ede72803792749d253cf
--- /dev/null
+++ b/model-00011-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f9d995d696ff479079e4eb2cbfda822620b6565ad393382e920876ec816a7f7b
+size 2095203836
diff --git a/model-00012-of-00189.safetensors b/model-00012-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..de44a7729cbc37163eb8a52de20209d539606c45
--- /dev/null
+++ b/model-00012-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:295995dfdefb76f9915731fbaf0779b7acaa2540fa1c3b52b14f66d78b1f3d45
+size 1358954708
diff --git a/model-00013-of-00189.safetensors b/model-00013-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..45ecd5695a2d2fdf057ada14338d2be728cbc7dc
--- /dev/null
+++ b/model-00013-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:053ad3dfc43503e4b44631eb51d837b3f08c01dbdb44bbb1516e69017967fc83
+size 2095203836
diff --git a/model-00014-of-00189.safetensors b/model-00014-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9623d0d8551ed8f968becd83dd1d24b4dc0812c5
--- /dev/null
+++ b/model-00014-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9fb57eba81ee64c8c6e661e3113a63470c0c9a87e2049d1efa18f44ffdfe1953
+size 1358954708
diff --git a/model-00015-of-00189.safetensors b/model-00015-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..06f8b2ce46696030a59f4300bca80c89501a4586
--- /dev/null
+++ b/model-00015-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d3fa0722515d8dbab46f7787f69d4dab4528f3b85512389e52d06ef9d8f23af
+size 2095203836
diff --git a/model-00016-of-00189.safetensors b/model-00016-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8bdaffd575cb3733e63ae4a422eb7ffc2a8b4b5a
--- /dev/null
+++ b/model-00016-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32d4703552bafa6af8abfde29ebca5c9188c76aea6a01c538ad56c41698151c2
+size 1358954708
diff --git a/model-00017-of-00189.safetensors b/model-00017-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6241d93b0a78b3194f345a16363207066f24a5bb
--- /dev/null
+++ b/model-00017-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2f42520344ddf8d3623ff183db863903c1887fa4043b8abd8d2969223182a67
+size 2095203836
diff --git a/model-00018-of-00189.safetensors b/model-00018-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7519de0f1723bb8f2fbe5ded05e52e4a5756c991
--- /dev/null
+++ b/model-00018-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4e60bb195f7a89f3ce350f3dd3eaaab44dfc2ce3eda8a6842428b6834b8f222
+size 1358954708
diff --git a/model-00019-of-00189.safetensors b/model-00019-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2ffc060fb2965d0e02ae08ab16880ebe62ca46b3
--- /dev/null
+++ b/model-00019-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d78907097c3dd061e20bdd069c380f2b8c936c72a32bbc8573c25445866d783a
+size 2095203836
diff --git a/model-00020-of-00189.safetensors b/model-00020-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3c2a4412e5ff191e04846576651e42ca79034429
--- /dev/null
+++ b/model-00020-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30564d2900e111d7a12c4413548c3f4e4dbe701e7ad156b257ce691ef4e4bbe2
+size 1358954708
diff --git a/model-00021-of-00189.safetensors b/model-00021-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0f4b1e13b0891ecee1918c668755d4d457e2e3cb
--- /dev/null
+++ b/model-00021-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:53eb12fde483fd0cc9ce9a010e74d443bd3f007eb556adbbc6a228a217b29216
+size 2095203836
diff --git a/model-00022-of-00189.safetensors b/model-00022-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fb1915df11fe23699c15d50215d1fdbc13ad66e2
--- /dev/null
+++ b/model-00022-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf3d8e9f1308ec0e7ae25e7e0bc8c8b58ad895d830d9eb3c2ffba0608ff06a5b
+size 1358954716
diff --git a/model-00023-of-00189.safetensors b/model-00023-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..37eae380d61485df36aace90fd697202de0927b9
--- /dev/null
+++ b/model-00023-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e124bc9daafbe95d926b6f1aee1d1707bec80f4bf34ad930ef2faaa4484f6ce
+size 2095203852
diff --git a/model-00024-of-00189.safetensors b/model-00024-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..86a499d20f8247a2b25fc0ae5b033b2c1e9c9586
--- /dev/null
+++ b/model-00024-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:177ca5c3def9898b2e848e096d8e835a646194ac70059f99d5378e9abccc98fb
+size 1358954716
diff --git a/model-00025-of-00189.safetensors b/model-00025-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b30060d1c331ccc369153528c7bc11f2fdb79e46
--- /dev/null
+++ b/model-00025-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c8425b9192b8d81a7768ca39036b945d82120df5dbb32171b5e229e26390775e
+size 2095203852
diff --git a/model-00026-of-00189.safetensors b/model-00026-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d87b4e8481037f3ed046d6aa6808209468efa389
--- /dev/null
+++ b/model-00026-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fad56578b0306c3bf9685f276692c1da378880af876b4c6d8b4f91277abcb561
+size 1358954716
diff --git a/model-00027-of-00189.safetensors b/model-00027-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bffad9b9f406112a0079e624c4bfeac999cf79f7
--- /dev/null
+++ b/model-00027-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:601fa83dc9bea36ab1bbd3fded2092737f12eb5820cb6c1812fc4772b5e191a0
+size 2095203852
diff --git a/model-00028-of-00189.safetensors b/model-00028-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6891ffbb48af6770d90563bc333dc3faf8804a6a
--- /dev/null
+++ b/model-00028-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4afeacd8653af6e30f1bcca18bce2488451e7678efb8595c6e9d7f399fbebcc
+size 1358954716
diff --git a/model-00029-of-00189.safetensors b/model-00029-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0fb99e77aea25e8c3dca66b7e154a15aa6c04964
--- /dev/null
+++ b/model-00029-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:974b92a564f3044c31d221f964069f7afa39eb4795db70f01c441ad4f0e4bc62
+size 2095203852
diff --git a/model-00030-of-00189.safetensors b/model-00030-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8ed619c3585746b4fe76b27cfda7dc9e761f72e7
--- /dev/null
+++ b/model-00030-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df044bb15845c94511169782387829e0f86ec76faa624e8cc730f2ad958ecb4c
+size 1358954716
diff --git a/model-00031-of-00189.safetensors b/model-00031-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7205c7907ab55bb30ec53710562ff987a9803702
--- /dev/null
+++ b/model-00031-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:01b5321072213be3510952662088fe206a56aaf13020076b6b37b0fb5f9f1370
+size 2095203852
diff --git a/model-00032-of-00189.safetensors b/model-00032-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e08d6b0255b51582fdf82d0be8e7f50ca38befaf
--- /dev/null
+++ b/model-00032-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:65ecd6b00a57a54f9b9f856311f9637d99663000014302f54c36297fa8edda1b
+size 1358954716
diff --git a/model-00033-of-00189.safetensors b/model-00033-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..36da41d9049df8f4851a87c8644834ed58280c89
--- /dev/null
+++ b/model-00033-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45454e5dc4f630f0ad3bdd55e65570c91c6665211b3b095be94a8550b43ab33e
+size 2095203852
diff --git a/model-00034-of-00189.safetensors b/model-00034-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1b151dc97d41985156ad3a6b6f6795da69982eff
--- /dev/null
+++ b/model-00034-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e32f6c316129612855ccfc9ea8a2635fc30545cfb9f22fb2f178e01537846f7e
+size 1358954716
diff --git a/model-00035-of-00189.safetensors b/model-00035-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..049d80d42ba35a55737ac9edbf43bea0fc4c806a
--- /dev/null
+++ b/model-00035-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f0da9a282090aaf8dd5e02468b89b71f8ed16c8b830d42a941e30470976b07c1
+size 2095203852
diff --git a/model-00036-of-00189.safetensors b/model-00036-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..87ffe616e1d927c51bc52fa1e2e29fee5198c11a
--- /dev/null
+++ b/model-00036-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a76de48532a89f6f0986a2827c3f0a79ec51a24c7a7088885d742d4a543cc8e
+size 1358954716
diff --git a/model-00037-of-00189.safetensors b/model-00037-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..79131df048d28b04dde81e4a3724b67c5e460c83
--- /dev/null
+++ b/model-00037-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e32eee7f6f95cc5a5ee279433659ad6b1463d488f1fefa2cc4c7fe677884a490
+size 2095203852
diff --git a/model-00038-of-00189.safetensors b/model-00038-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ba125d1522a186fb21b65de51a11a591080d6def
--- /dev/null
+++ b/model-00038-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f6f1918e4ff4095d942458288e2f4a1f9fa51a09321bba7fe043d53744c4886
+size 1358954716
diff --git a/model-00039-of-00189.safetensors b/model-00039-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ea3f39daac4cc74e2c9be6d31433274370f381fd
--- /dev/null
+++ b/model-00039-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bbba97b91379b6d4c51e4bb0636231dc0735848b41fb2b376e8c23df1baaac4a
+size 2095203852
diff --git a/model-00040-of-00189.safetensors b/model-00040-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3337305125dd99f0b758db71af60372e15fbc333
--- /dev/null
+++ b/model-00040-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f92c091572ff317063ec352b0190ae9c654e67bccac623d4298980c02ff15f1
+size 1358954716
diff --git a/model-00041-of-00189.safetensors b/model-00041-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5857e822fbda7be98a499c0b9d06e7aca5e1bee5
--- /dev/null
+++ b/model-00041-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b760acd1baa08564d006fbd5506e3c327ba0808a48c85cf532064f868a32bbfe
+size 2095203852
diff --git a/model-00042-of-00189.safetensors b/model-00042-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..00ff0f079a4f29ecf799b03450870d1973a1aa24
--- /dev/null
+++ b/model-00042-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ded4f3360b3c85a14c7e3a55b60e2c4ec8ae9fc7c7f9030c36436348d13423c9
+size 1358954716
diff --git a/model-00043-of-00189.safetensors b/model-00043-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..25d2cfc37ab00b78532e578ac81a3e0af9fd1ac5
--- /dev/null
+++ b/model-00043-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4f3f1a4d732e41751b65dc0566abb5daf04d2746204511d76e262d47f3076447
+size 2095203852
diff --git a/model-00044-of-00189.safetensors b/model-00044-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d0a3960bd3afcefb21435b54c9a7cbda155c7cbb
--- /dev/null
+++ b/model-00044-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74a4a2b4096e276890ff25b779b653535ce4cb3c5dbeb39f6b7be408d997900f
+size 1358954716
diff --git a/model-00045-of-00189.safetensors b/model-00045-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e68126b1d36ca1e608bdae2c80e18d6db0bd38e4
--- /dev/null
+++ b/model-00045-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b2c0c82b56ac317fdfc36ceff7257a731732326e7700d8a38329f520ac09c403
+size 2095203852
diff --git a/model-00046-of-00189.safetensors b/model-00046-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..326f03200bd82f07bb6260b601b7ef13d87034b7
--- /dev/null
+++ b/model-00046-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82e62e7a891fe44ae1d5a237b0f0285ea60a5ee1bb117bb83cf10e92322dd021
+size 1358954716
diff --git a/model-00047-of-00189.safetensors b/model-00047-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..82b44ea0f6315b57e9d9746c1881612f00c7bcfe
--- /dev/null
+++ b/model-00047-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8eca8f41a8eebc4a8e08ab59041c2942895ccdea4d7f8dcb003e1f878ad699fd
+size 2095203852
diff --git a/model-00048-of-00189.safetensors b/model-00048-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d1ef08c8db4015000cedb6da6fcff7033c29a920
--- /dev/null
+++ b/model-00048-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d1cfbad5360619e143ef08010e81496c71f49432f78928da1c86c0b0c1a7285
+size 1358954716
diff --git a/model-00049-of-00189.safetensors b/model-00049-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..496f74b32b7e9d0216255b519216fc4bf6640bc7
--- /dev/null
+++ b/model-00049-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:585cc6fbe7238d38b431536256bc3ebe645342448421c0e40b8b2309648b8069
+size 2095203852
diff --git a/model-00050-of-00189.safetensors b/model-00050-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f1e98eb2b7db834912f9e9cb6588c585a94260d1
--- /dev/null
+++ b/model-00050-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:629731503ffdbba2cc912a373c624d4a5581379f6a940d9a93d4b1f82a91b617
+size 1358954716
diff --git a/model-00051-of-00189.safetensors b/model-00051-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7c90291350e935ec0e752d70b3d19ecd4aeef5cb
--- /dev/null
+++ b/model-00051-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6ee2dc51f841bafacaeb0a6476e73a2870e2465eb15d341e2ec86b4f84732150
+size 2095203852
diff --git a/model-00052-of-00189.safetensors b/model-00052-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..442b23903c6034e165816a29abbf8d0cbc6e4c2b
--- /dev/null
+++ b/model-00052-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1287587817b7acd0949440c760bd707915be8f35b5d0fed7869fd9b74f8a8dc0
+size 1358954716
diff --git a/model-00053-of-00189.safetensors b/model-00053-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9858b8bc2f411fed3ce5e248114625e97fefadfb
--- /dev/null
+++ b/model-00053-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc6b4da7b048e20626db0b7ccbf4ae065800cee557147825a8a43034b5e24f32
+size 2095203852
diff --git a/model-00054-of-00189.safetensors b/model-00054-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..79d3910e1c09b435f26728993922cc5f6bc5f4b4
--- /dev/null
+++ b/model-00054-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b12511a75f27a4a1e2ad3163e646e44bea7d4f9a6c9c4976f9d4bdee0eefc2c
+size 1358954716
diff --git a/model-00055-of-00189.safetensors b/model-00055-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cb4599b51c6db0ecd5e07b487a7b300559b4cf33
--- /dev/null
+++ b/model-00055-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0889391451b3283a020e3d435dca139ce1d2a5405d5bf6a690076795506e523b
+size 2095203852
diff --git a/model-00056-of-00189.safetensors b/model-00056-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9410d9ee59c10d2c2be80d2309125e699fee4e80
--- /dev/null
+++ b/model-00056-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32b5c5d94c97c0070b5bc1baabc44c65e9c9f4799dbe7615439699dc9955996f
+size 1358954716
diff --git a/model-00057-of-00189.safetensors b/model-00057-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c64a16a1cad6d601fbb0d964b50b6d0ee41d60d2
--- /dev/null
+++ b/model-00057-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1c9aa40429fa8779f20fa6925e7bcd746cc3e960d677b5e0a401eaa3bbe49b3d
+size 2095203852
diff --git a/model-00058-of-00189.safetensors b/model-00058-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e63f3957b28072e4cb5a71d060c7080f05899965
--- /dev/null
+++ b/model-00058-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d44301a4a1266ad6b406e2f7fbb84105b20eaa52096f024c0896efb82056cbb2
+size 1358954716
diff --git a/model-00059-of-00189.safetensors b/model-00059-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7e4273cbc8ac6ad5f7c3ab65885308e3fdeb595a
--- /dev/null
+++ b/model-00059-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c9ed620dec9892da9eb3e64ec1d29fbe3ccb94756dbc4b7d5dd0f9d32f52cff
+size 2095203852
diff --git a/model-00060-of-00189.safetensors b/model-00060-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5ec558bdf2d3da323c82b091518ac615d00f1772
--- /dev/null
+++ b/model-00060-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:46e7de2bacf824274ced48543999ca7844f8cf9588d2c19348d72f104fcc2003
+size 1358954716
diff --git a/model-00061-of-00189.safetensors b/model-00061-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6ca1615f890b1f2baa6ad27b32e461e224e6a9d9
--- /dev/null
+++ b/model-00061-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8b6063e1d6a6ea5e53b804973fdc24776ae2e33481d5f830bda1cc2e63afeaf
+size 2095203852
diff --git a/model-00062-of-00189.safetensors b/model-00062-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3aa19e7275e17b1a416fbaeba563f015ade4cc44
--- /dev/null
+++ b/model-00062-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:01914ee4228a47918aaf1e728f0f9beca40295e83cf17ee05a588ac68924a798
+size 1358954716
diff --git a/model-00063-of-00189.safetensors b/model-00063-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c99509da339ebc5760d68b0052870bef5ade0e4e
--- /dev/null
+++ b/model-00063-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6de3b35d9e4e494e0e9ca98dd1bcfd2a8830dab08cb1a5cff964a86725154b98
+size 2095203852
diff --git a/model-00064-of-00189.safetensors b/model-00064-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a4d8fa6071560f6493a80807d98a6645f77baa72
--- /dev/null
+++ b/model-00064-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3531578cd7dd5a413c4a80fa64243752cf7191f143fe8b9ec2ccb3732a4b3f87
+size 1358954716
diff --git a/model-00065-of-00189.safetensors b/model-00065-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9d5a3548bc4354074f6b044aacaed3547102e007
--- /dev/null
+++ b/model-00065-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:647b1f02b882ae40ad602daa39335cf76e88fb0b667b199e88acd54b496e0011
+size 2095203852
diff --git a/model-00066-of-00189.safetensors b/model-00066-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..81fec8cf0ee076b638b302ff877dc70e0495c740
--- /dev/null
+++ b/model-00066-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:200440e5f25f6e092b988264cc54eb0baca8b15e3983a8915a7e0f8b00911b4a
+size 1358954716
diff --git a/model-00067-of-00189.safetensors b/model-00067-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4dbcf9105d184162bf23306350e61bfc2bbd23b0
--- /dev/null
+++ b/model-00067-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c13899c43cb8237314278ec836848ec1d649fff24e1fd46c026321449593ad70
+size 2095203852
diff --git a/model-00068-of-00189.safetensors b/model-00068-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..56fa10d913bd8d5fbc121cbf90dee99c08fe7819
--- /dev/null
+++ b/model-00068-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:973db23564329c1e69b7722fa288cacd89727b65013b6c10b99e45cc2df492ba
+size 1358954716
diff --git a/model-00069-of-00189.safetensors b/model-00069-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..39dc50afa23e6c539d46c3aa734b6a4f98b2b8bb
--- /dev/null
+++ b/model-00069-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bd011f924ff9e40ec355a57bf3415a80cb969d7504f3ef75d7367aeba1af975d
+size 2095203852
diff --git a/model-00070-of-00189.safetensors b/model-00070-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7ea53a660aa45b5ec12ee8936bd19ea803f0f3c9
--- /dev/null
+++ b/model-00070-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d3c2486cfb0d233ffca6291b5ffdb505e940fd1a5ee5dcbee2629bba20bba9c
+size 1358954716
diff --git a/model-00071-of-00189.safetensors b/model-00071-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c88ad36fa8a1887271159d38da95ac5a74fc3e80
--- /dev/null
+++ b/model-00071-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f19afd445f2783aac082b84dee2f432f9841d0430f37b50490d23899baa8b95b
+size 2095203852
diff --git a/model-00072-of-00189.safetensors b/model-00072-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4227b9bd8c78beb41505815a4c761ae12dfaaa85
--- /dev/null
+++ b/model-00072-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0bdbfdca2fb791d7038be60dd199b787f6822b505751f451a79c03869ccdfe35
+size 1358954716
diff --git a/model-00073-of-00189.safetensors b/model-00073-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..68e5348eab9ac86bd722daf119b98c8c9d0b6b0d
--- /dev/null
+++ b/model-00073-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7ac1444e11c689491e765da06760149d80e13819b00e7566bc8174709104f4d7
+size 2095203852
diff --git a/model-00074-of-00189.safetensors b/model-00074-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e2768ed82b0a981ccdccfde139b49b581a0231d2
--- /dev/null
+++ b/model-00074-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4883fb98e63f9a0ebd92e6c3558e4f1a91eba5cf1395bff99b564001f200d255
+size 1358954716
diff --git a/model-00075-of-00189.safetensors b/model-00075-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1eee3c46143aab63e3697ce642808a39ad9744ca
--- /dev/null
+++ b/model-00075-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f27b923990b9eb4f0431acb3e0133270751eba78593fbe5f22ee2b294cf41df
+size 2095203852
diff --git a/model-00076-of-00189.safetensors b/model-00076-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8c520c21e25ddefa168763dc1b592ef796112eaf
--- /dev/null
+++ b/model-00076-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2b5383f1873fff0cee01ad6e82882077ef7e4e75669ae40bbf8324ddb418a369
+size 1358954716
diff --git a/model-00077-of-00189.safetensors b/model-00077-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9925fcc8195bf1b2d4954e4b0c32f22bacb2fb4b
--- /dev/null
+++ b/model-00077-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1bfc8f8dcfda572d58be0e076a9d8fb627aeb4e5508a1009a41452333a205b9d
+size 2095203852
diff --git a/model-00078-of-00189.safetensors b/model-00078-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..35306a0cdee36d349ca49e9bcd8942fd001e5021
--- /dev/null
+++ b/model-00078-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c2920e5838664fc8d9a30db1b424c503039b4e093b52795c9390d5b1f53c474
+size 1358954716
diff --git a/model-00079-of-00189.safetensors b/model-00079-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b34ec6dba347252ab6ac509915ab30f6b5364b5c
--- /dev/null
+++ b/model-00079-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fa08d2afeb644da068852449d57589d8b4085e98ec022ef04d3b2be6671fbe55
+size 2095203852
diff --git a/model-00080-of-00189.safetensors b/model-00080-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3848a16fe35aa5e1974af65aed2b1221706b97ee
--- /dev/null
+++ b/model-00080-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:42c65f0a8bae6fa599ae19a785d4b0f2834168a9ef49cc2777d9201cf3b55e71
+size 1358954716
diff --git a/model-00081-of-00189.safetensors b/model-00081-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..087da060ddcb99c570622326948ea1009e1bb001
--- /dev/null
+++ b/model-00081-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:85ac2ca05b05ff5dd8ccf57d8b7582f85143766fc07f4958afb46d95a6770ea8
+size 2095203852
diff --git a/model-00082-of-00189.safetensors b/model-00082-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6201cce042dd8fdc1c15993921ca9597015dd53f
--- /dev/null
+++ b/model-00082-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02c5a7094d83d1339be01711bc7ededa13691d588ca921d60e1269fd02c98c48
+size 1358954716
diff --git a/model-00083-of-00189.safetensors b/model-00083-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7331cfcf62d1d483f34bf3d5132a248d3c6cd03d
--- /dev/null
+++ b/model-00083-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e0c58831a0d00c09a4c60725ba46b7e4ce77fef2eb8c7d8dff7b660095572b10
+size 2095203852
diff --git a/model-00084-of-00189.safetensors b/model-00084-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..370a056046c6d0e19e7f99280ac4e60ec0f0f647
--- /dev/null
+++ b/model-00084-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1cf564c5bfaa74fe54f2bb93332608c3f64ea34c6878bba46cbd97c0e099388d
+size 1358954716
diff --git a/model-00085-of-00189.safetensors b/model-00085-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..778ad3b10eaf3312c748fabf61787097145bedb9
--- /dev/null
+++ b/model-00085-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54612a5ee182f878ae023e3abd6f025b1c23695c673220c8b1e4a4c83df3de5f
+size 2095203852
diff --git a/model-00086-of-00189.safetensors b/model-00086-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..22d44820c4049d8d64e432927c67c89b17cdc9b2
--- /dev/null
+++ b/model-00086-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ecb5a0be2cfe386a2fbf4a3ac21e37288e2c89e2863fd5241b6b7bcd1265a02
+size 1358954716
diff --git a/model-00087-of-00189.safetensors b/model-00087-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e5726d2311316876002870003cc21d47bf144cb1
--- /dev/null
+++ b/model-00087-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05043d87540fa4d909ac395aa2763c9a72e292c804cea9a1b6cb66a89d1cd2b6
+size 2095203852
diff --git a/model-00088-of-00189.safetensors b/model-00088-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..157c5c9375ca57a101034704a65c89663ba31869
--- /dev/null
+++ b/model-00088-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ae9719d7588c746e4b47de5092a475d79cbf082cf0a9db5ee8a8eb7d9a5e521
+size 1358954716
diff --git a/model-00089-of-00189.safetensors b/model-00089-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a6d2d1df02234118da7bff3671e789be1617c472
--- /dev/null
+++ b/model-00089-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27d64abc95122734df0182fa6983a3c9fd72264d1d05aa80ef64b81d3201ac3c
+size 2095203852
diff --git a/model-00090-of-00189.safetensors b/model-00090-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..16e4a48a2ee202b73c0e82475e78daeb5d57a723
--- /dev/null
+++ b/model-00090-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1227c633dceeaaf21e4874e72b4b502c9286e63c15b8f4d59a06d3732dd82c3d
+size 1358954716
diff --git a/model-00091-of-00189.safetensors b/model-00091-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..06983d875c647e2153516f3d9ad33c425a6956a2
--- /dev/null
+++ b/model-00091-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:03284117586962f32a59f0f6bb75f54d5e1bbe71005ff6742e83851ad669063f
+size 2095203852
diff --git a/model-00092-of-00189.safetensors b/model-00092-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a31a70a45bfc4904404e69613405e4e128a515f7
--- /dev/null
+++ b/model-00092-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f555f575d42dade93afa1d2d7f5050e353025aedc4671a7bc082c76bc6e7f5e9
+size 1358954716
diff --git a/model-00093-of-00189.safetensors b/model-00093-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f73680df4afe16ee3125a84930a969d5c3fa3f6b
--- /dev/null
+++ b/model-00093-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c994b63819d124d3502f3b321845155bf4ceddc77b36345575ea4ad84c6b647d
+size 2095203852
diff --git a/model-00094-of-00189.safetensors b/model-00094-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a452223f9ae84e68e8b25e8a406b0b5adf2c91b7
--- /dev/null
+++ b/model-00094-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b23ca84563b2e51ecf0b51ec10315c10a3180ec03c491d71f3ddc954309e9c54
+size 1358954716
diff --git a/model-00095-of-00189.safetensors b/model-00095-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bfea084546443c9adf5dafd053c15f0a75fe438c
--- /dev/null
+++ b/model-00095-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32a5d681513c2386713b0126aeaa948d9f8580307b458c051e35dbf79f2632ad
+size 2095203852
diff --git a/model-00096-of-00189.safetensors b/model-00096-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f804a37653f8d9ad08d3ddbf39ebda00324182a8
--- /dev/null
+++ b/model-00096-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f603d056be77baa9d1d26b14d050388e327c8590558bd6794ed758064988e66c
+size 1358954716
diff --git a/model-00097-of-00189.safetensors b/model-00097-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..83bd9e6c8fa0d86a591b28b333dfa7c79c5f1fac
--- /dev/null
+++ b/model-00097-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:308c63c68cfe109c6230cef727a8011a95a89dd86204e05dade05b31e6945403
+size 2095203852
diff --git a/model-00098-of-00189.safetensors b/model-00098-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3e65641972b1a48ea6e63d5cebefd4f47048f7b5
--- /dev/null
+++ b/model-00098-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d424cf33e05c0fb2643a95be5d6f8005edb3421a9f9c16a1ffff0e1135ceca9
+size 1358954716
diff --git a/model-00099-of-00189.safetensors b/model-00099-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..18855faa1bfd31d8f5080ddc48b4196104173bca
--- /dev/null
+++ b/model-00099-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:819b2c0c6772a078d28433cc6dea707f5771d2d5dd204d9357d66fa818f11c3e
+size 2095203852
diff --git a/model-00100-of-00189.safetensors b/model-00100-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a5f1dddbb0ec460ba88171743e9068d81a4e541e
--- /dev/null
+++ b/model-00100-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:184a323d3158f05ff77219ac3031d165c9b94ed24c0314a645cca2c18117b678
+size 1358954716
diff --git a/model-00101-of-00189.safetensors b/model-00101-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..68e6a437540a3ea3b525187f00103c6b7e2d1a98
--- /dev/null
+++ b/model-00101-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:06e9bdd310159cc69a6fce1e7df4912f7e220bee32e3cf26d3fa0152658c6816
+size 2095203852
diff --git a/model-00102-of-00189.safetensors b/model-00102-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f45baee8e81e0252b8fb4801d0f802802e9cc68a
--- /dev/null
+++ b/model-00102-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3aec0f4274cb3bbf92b17e7d556cca524b6d576aabebe158fca9f10d9276100d
+size 1358954716
diff --git a/model-00103-of-00189.safetensors b/model-00103-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2debc052727bdc2a66cd67477b97f1bebf933f44
--- /dev/null
+++ b/model-00103-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e419f3a456e88e2e77afc1d16d003c9cf4ee1e9d7e84a67154b73058a4adc7c
+size 2095203852
diff --git a/model-00104-of-00189.safetensors b/model-00104-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e264ebcf3746939b32abada79319366f303058bb
--- /dev/null
+++ b/model-00104-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f575176703c9e968691fddde73a574b61104a45c5857945f78d9786113b65ab
+size 1358954716
diff --git a/model-00105-of-00189.safetensors b/model-00105-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8cbe74704f90e602bef1ba7cf22b84a8a2966a93
--- /dev/null
+++ b/model-00105-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4869dde8048201fe2593f60f08514be1cf4dc34f1195eb55ad48bee56a2badcf
+size 2095203852
diff --git a/model-00106-of-00189.safetensors b/model-00106-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..68d4636c23ef1e33e95cc893d30fc0fd8fd1a1d9
--- /dev/null
+++ b/model-00106-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a54e9f87f79d6ff8336a39219608e19b3633c66322342fec6ce4306bcabcb355
+size 1358954716
diff --git a/model-00107-of-00189.safetensors b/model-00107-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1dc66bbc6ccaeeda92257b08db4532fe95081a1e
--- /dev/null
+++ b/model-00107-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d3debdd320de09f09a5a2e38702325fca713ae6586c7a9826dfb31773a9cc5b
+size 2095203852
diff --git a/model-00108-of-00189.safetensors b/model-00108-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7f4e91b5393005ce70f7a8443049afba819ae755
--- /dev/null
+++ b/model-00108-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b0fd4a542fdaf4eeb5e84208437953944a59a9c612a3d677c17825afaeecc720
+size 1358954716
diff --git a/model-00109-of-00189.safetensors b/model-00109-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a922b3413e5e15a6f9c4b30de319b3ebfa675845
--- /dev/null
+++ b/model-00109-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37bd1cb6534eca4228a436ebb29db377c2bca51a342191fdcc5b737ffe16cff8
+size 2095203852
diff --git a/model-00110-of-00189.safetensors b/model-00110-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..41ea8541cb864bfedcb416c9704fa2c710e27434
--- /dev/null
+++ b/model-00110-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be310bc67218f32e2b4cbb477324cfad8a74f2d4edab3259ef6e4444fada234d
+size 1358954716
diff --git a/model-00111-of-00189.safetensors b/model-00111-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3bcb9d54af1acf045a7fc682a154883196c1f1f1
--- /dev/null
+++ b/model-00111-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a1687f7db1d8f604584451ecf02207afb0667242e45010e890e6b499ef792ded
+size 2095203852
diff --git a/model-00112-of-00189.safetensors b/model-00112-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..868d17a42875c307dc26661831eea99cea7bac0d
--- /dev/null
+++ b/model-00112-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf1be021c1363d59970ea9fc89ca37c9dcf744f379d79240a44de9d95a94251e
+size 1358954716
diff --git a/model-00113-of-00189.safetensors b/model-00113-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d5d4d1eb5cc15a9b64b5d3631b3e4a89ebfdfe83
--- /dev/null
+++ b/model-00113-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86518b5cee0d899022fb3b35aedb9cc2ce530b6a3136ca69ad05957be3c613e1
+size 2095203852
diff --git a/model-00114-of-00189.safetensors b/model-00114-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..413eb1fec4e5d79535f79d77bfa220fe769ff4cc
--- /dev/null
+++ b/model-00114-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fed002910bdbf663096a1c8178b19d5367d5ba239c50604017f19b66b7872441
+size 1358954716
diff --git a/model-00115-of-00189.safetensors b/model-00115-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2a5d2206d7a4f5cc6291e0951b53cc5593f7f721
--- /dev/null
+++ b/model-00115-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d70a079b70291425bd30e88f58cfda33a137aa8bc45c3f743b8fde4b4d833cc3
+size 2095203852
diff --git a/model-00116-of-00189.safetensors b/model-00116-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a385affc3a95301b779f758ef2994e23adcd7e29
--- /dev/null
+++ b/model-00116-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:789d885c948e9b6fc18b1012e971ebacb68eae2b7cf4c050e912783533ea5b5c
+size 1358954716
diff --git a/model-00117-of-00189.safetensors b/model-00117-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8aed6da15fe849a038841aa07135ec1afad3112f
--- /dev/null
+++ b/model-00117-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e935f57e1ed80795c35ef89ff91179d2404bb4c0594324844ef5a8689882d044
+size 2095203852
diff --git a/model-00118-of-00189.safetensors b/model-00118-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c4457ecb331cd3d4e3b18f17b267f4a827a120b1
--- /dev/null
+++ b/model-00118-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d253b4bf6f326adf3861dc49cb8dd5fdf48a013fca2221491e0ce04459728c6
+size 1358954716
diff --git a/model-00119-of-00189.safetensors b/model-00119-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..969b6be4a2d226153a22685dc368ebfb437a9258
--- /dev/null
+++ b/model-00119-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e32e66077d103c76c4505320e99720eed4292bff73dc3fadf03e41b171de0ed
+size 2095203852
diff --git a/model-00120-of-00189.safetensors b/model-00120-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..711543717ddfe516a477738a2308ed428fa8c5d5
--- /dev/null
+++ b/model-00120-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:15be7b7e2ce582b7641bad762af0ebed039456f4232de57df16dbc2bb2d0f52e
+size 1358954716
diff --git a/model-00121-of-00189.safetensors b/model-00121-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..971e796deeb5b8d787f6d16eea6300b0d75736bd
--- /dev/null
+++ b/model-00121-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfef6653784e89cb8e3d449474520d7ad99bfd3dda2df47a8b9ba9b6b3482e62
+size 2095203852
diff --git a/model-00122-of-00189.safetensors b/model-00122-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..11ad603f2b1da9b815c086393ece3f660a3cb190
--- /dev/null
+++ b/model-00122-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd4d5a6b997eafd94d68235ef75a6dc5decf4c2a742af547d2831d75369bdbee
+size 1358954716
diff --git a/model-00123-of-00189.safetensors b/model-00123-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2b0810ef1635ec1249836c5971348a40ca344842
--- /dev/null
+++ b/model-00123-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b7874ce775a378b543ae39b4bc1556f0f82f252823ad98a13472d6dc73633a6
+size 2095203852
diff --git a/model-00124-of-00189.safetensors b/model-00124-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..50fc73b0e815d67719bdb3989a280fbe80779fa5
--- /dev/null
+++ b/model-00124-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9abd92df4bf7866df8c7b68ad55b032705abd79651d6b257f2ada92af7b289b3
+size 1358954716
diff --git a/model-00125-of-00189.safetensors b/model-00125-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..84a57d2cf81b077eed549a477fb00f6da8931ca3
--- /dev/null
+++ b/model-00125-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5af2b9547431296fbb6ae592d1ea4d03c56c84bd1da2c4d0e775756036fac844
+size 2095203852
diff --git a/model-00126-of-00189.safetensors b/model-00126-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ba8bae0b96990fc8a634273c30d112c7d0449aa9
--- /dev/null
+++ b/model-00126-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:96635cd1dde375685f787251cc3281532dfd6aa24c3674e82f020f226ccaad03
+size 1358954716
diff --git a/model-00127-of-00189.safetensors b/model-00127-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d9ea42e07e8a73687899edd48b02e43acf184616
--- /dev/null
+++ b/model-00127-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02c6e85c1c1637cc55a75af3a679aac1d848760ee0276acfaba90c3c40f75b8c
+size 2095203852
diff --git a/model-00128-of-00189.safetensors b/model-00128-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5a52c755f528dba24347bc588b7a2007a5a24444
--- /dev/null
+++ b/model-00128-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb1c62b737735e208d21256f7600f31f67b8548890c47625dc8fd6b4c13c583a
+size 1358954716
diff --git a/model-00129-of-00189.safetensors b/model-00129-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..df2e0f07d3483f5a239a67d4110c208669858e67
--- /dev/null
+++ b/model-00129-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:87255f8b454ff1dbab1a831a6a06a8457cd8c3855c2e8671cf3250998401c2db
+size 2095203852
diff --git a/model-00130-of-00189.safetensors b/model-00130-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..db69cebae14b51a0e82b2af8a14d7e40ee222e85
--- /dev/null
+++ b/model-00130-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f725882d4991380c5477c816571498f12c8aee0a082f6391ab2934467e6a834
+size 1358954716
diff --git a/model-00131-of-00189.safetensors b/model-00131-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..520fbfd0449f27d1004a5ee7f97fdd234ab5a0c8
--- /dev/null
+++ b/model-00131-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:70850c9b02d5aa827e5fd5cdc51f9aabb177bef19966c1c207bbeb0de6ef01c3
+size 2095203852
diff --git a/model-00132-of-00189.safetensors b/model-00132-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..20f11d7cf7dbdaa6f694fe149dedba228649a098
--- /dev/null
+++ b/model-00132-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f0d93576f0b509fec066141bc932b9513b5b6357e84dba3cddce85cba2672f6c
+size 1358954716
diff --git a/model-00133-of-00189.safetensors b/model-00133-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..332862dd3725857ebb2be4b97235bf4351b856b9
--- /dev/null
+++ b/model-00133-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b3b227d5029ca7c47eb4076dfd46c845e85d6b12efd4ef4188a692493a6de0de
+size 2095203852
diff --git a/model-00134-of-00189.safetensors b/model-00134-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..025b49ec6c4c3a14400c405f717b92877e07ed6b
--- /dev/null
+++ b/model-00134-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e775b68b1e1aa95372b488039c689ebf24687abf3b67f032188ad6b23a440f6e
+size 1358954716
diff --git a/model-00135-of-00189.safetensors b/model-00135-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ced54b23820f776b4bb01bee9feafc25417c495e
--- /dev/null
+++ b/model-00135-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17cbb3e5437f59ceeaf4e55251669f5a779b17dbd757b5d12a8b6b9ef86804e0
+size 2095203852
diff --git a/model-00136-of-00189.safetensors b/model-00136-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..77d81bdf8004fe8a43cc50065e12f7135212a168
--- /dev/null
+++ b/model-00136-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43edb264c18c69ce260a4b1df0d35d69a81eca109f05ca6a830b2c8928424419
+size 1358954716
diff --git a/model-00137-of-00189.safetensors b/model-00137-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..609a23ca8fe9ae06be2399b4f762c584a72bbda2
--- /dev/null
+++ b/model-00137-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b496fba8d1af463505c3ec9d4847be05405a6ad3947e4e7ecb99bc4ab4fb971
+size 2095203852
diff --git a/model-00138-of-00189.safetensors b/model-00138-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8eb2e0a6a6cc59ab9a7719bce921aca2e72ae16d
--- /dev/null
+++ b/model-00138-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:036ce35df59ffdbf2b66aaa9b7bf8fd805f7b896b54d7d67ba0185b7e1ad9e6b
+size 1358954716
diff --git a/model-00139-of-00189.safetensors b/model-00139-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..052510818dd3dbe3370ca14df20c90df014b19bf
--- /dev/null
+++ b/model-00139-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f8372b161392ae47f9b40c0f5d206d13e4a1a4d22b1c485a1dad20ac435abbb2
+size 2095203852
diff --git a/model-00140-of-00189.safetensors b/model-00140-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d3517d904aea1a572ee4be61614108a82244807d
--- /dev/null
+++ b/model-00140-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b6fd107ed26e9b7a759a3e1ed90b6643a0eb5d27ed9b8278fa547f210d52fde
+size 1358954716
diff --git a/model-00141-of-00189.safetensors b/model-00141-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1713d50975078d16cd073032889906763f7ba3ed
--- /dev/null
+++ b/model-00141-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:24c1e676336085096c57a4f7ff2b51108ab533582257457eb6bb37a3145176b4
+size 2095203852
diff --git a/model-00142-of-00189.safetensors b/model-00142-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..69d94b3688c3e91afc59d66a1a84c91ea8c6597a
--- /dev/null
+++ b/model-00142-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d42ee23a6bb789f37d90a7f98df796a5859f650ea40e885387af148b19b83fe
+size 1358954716
diff --git a/model-00143-of-00189.safetensors b/model-00143-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5856f7ac7df8d30b60efd3f6e8c2ac2b848b8c1f
--- /dev/null
+++ b/model-00143-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:193ff1144b00274a13cda5f2eafec036fd65820e7a3964e7d8b9745e5a26d3ae
+size 2095203852
diff --git a/model-00144-of-00189.safetensors b/model-00144-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3ea044ea98281b6fb06d7417fbf5b4a412271c2e
--- /dev/null
+++ b/model-00144-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54bf87322d63d03430a4bead8462bc8af50f6edc498bf9f00a7087d8e18680a4
+size 1358954716
diff --git a/model-00145-of-00189.safetensors b/model-00145-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..19dcd7cc9e85da5382ed1a0147c965ea5d064ebc
--- /dev/null
+++ b/model-00145-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26a502ff5406e65630d5f0623ef9e129a5eccd37b6b4ab4a15999346e2be87b7
+size 2095203852
diff --git a/model-00146-of-00189.safetensors b/model-00146-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ccbe98d681a810ec25f3605f962e506e0b310116
--- /dev/null
+++ b/model-00146-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c0f3b5a8d3f9856373e714f23e054c2ad14fb803992d5e2cc1d2eb16af543a3
+size 1358954716
diff --git a/model-00147-of-00189.safetensors b/model-00147-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5772ecc2122c4075533a62fee7b89de6b4c15b46
--- /dev/null
+++ b/model-00147-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f20d617919b0c63cf09f44a7f24bc6b33346eed1f9e09fa8e06439dd1628051e
+size 2095203852
diff --git a/model-00148-of-00189.safetensors b/model-00148-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..976647484255d7574d8366e0c32f2be21b7ccf32
--- /dev/null
+++ b/model-00148-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4dd85ef72831350e4b3e883e591eac9a77849666745b11e45af416be34a718fb
+size 1358954716
diff --git a/model-00149-of-00189.safetensors b/model-00149-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6c59725b592c38f5d48e71e57ece7e7d73ee7a48
--- /dev/null
+++ b/model-00149-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6eb4d24c242c6f58e88271c96c7eb40621dc05085f9fb83716bf822922b878b
+size 2095203852
diff --git a/model-00150-of-00189.safetensors b/model-00150-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4c6294c0958b27cf0bc07ec801af2d85b3a2daae
--- /dev/null
+++ b/model-00150-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:06f6d48c2022fd77cd8ec348396bce7d534e4a91160af43b67e379d231229770
+size 1358954716
diff --git a/model-00151-of-00189.safetensors b/model-00151-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bf645e99bdc28df65f151d8d4d81db4cc4decbf6
--- /dev/null
+++ b/model-00151-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:51f3bee571eb9449c413f055d194d971a32dae957d8c1d2ed74e2cc6053bc216
+size 2095203852
diff --git a/model-00152-of-00189.safetensors b/model-00152-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e455b612da5a51271cdb32d426c287250d118c02
--- /dev/null
+++ b/model-00152-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82c6e5c38236501ae3340e757ca0abf7bc17e1b4b38682b780bbb62b933d97e2
+size 1358954716
diff --git a/model-00153-of-00189.safetensors b/model-00153-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..42c3ef3222f28928068bbb4cfa583f6dad408dbe
--- /dev/null
+++ b/model-00153-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f5d8b237fb680a64b14920a878dc15f7b6a67582e934aeee2a1e0e829a2d9215
+size 2095203852
diff --git a/model-00154-of-00189.safetensors b/model-00154-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bdc7c99591621092087d1ff1faad02ed5902c517
--- /dev/null
+++ b/model-00154-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:312a027ff6b4f74d5a697e4aa7c176a3638e6350992703b9c2b3c7cca7f32e07
+size 1358954716
diff --git a/model-00155-of-00189.safetensors b/model-00155-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a5bb68b7c04dc1ad89e1b53ac8d5ab0a01bca871
--- /dev/null
+++ b/model-00155-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:073747061563466f80431652a2e0b1dd0f937c7923b2baf59207c524e434f32d
+size 2095203852
diff --git a/model-00156-of-00189.safetensors b/model-00156-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5dcdfe6345e8b3c9d46af2197ea8284cc47fbbe8
--- /dev/null
+++ b/model-00156-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f485ab05fa7eff13082a9c61d7709baecc5b255da8c6fc65e67ac763af54b67
+size 1358954716
diff --git a/model-00157-of-00189.safetensors b/model-00157-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..421210960f52b4897bbd43088322b908006f6559
--- /dev/null
+++ b/model-00157-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae718696579a232afac7f76315c6ed3495434318b025d5cd1741bad8198a7fb7
+size 2095203852
diff --git a/model-00158-of-00189.safetensors b/model-00158-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a8c91c86369b6311618262087e9cc0477e56483b
--- /dev/null
+++ b/model-00158-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0fe0f96c5d21522391a72445c583100e564d20302412e6f2cf802f9da428c593
+size 1358954716
diff --git a/model-00159-of-00189.safetensors b/model-00159-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b920fd646a015c1bbb5f8061d88a603203a56882
--- /dev/null
+++ b/model-00159-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f7b76e7dd5e18ebad2bc82bff63097cdbd7e62a94b5d5c4fe375dcabe35d109
+size 2095203852
diff --git a/model-00160-of-00189.safetensors b/model-00160-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bb0bac1929f7f98f4c8557b9788a1fae1bceab8b
--- /dev/null
+++ b/model-00160-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:193f611d8ebc1c98b164ee886bff0f6246f67f3d724e6122ef10cbe3801acd8b
+size 1358954716
diff --git a/model-00161-of-00189.safetensors b/model-00161-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..88b340b4e573b507a325b9bc314a7e421b47e9bd
--- /dev/null
+++ b/model-00161-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0498b26c65ca56987fac840096fa7e253841989a473ad9b061778f93b6d391c
+size 2095203852
diff --git a/model-00162-of-00189.safetensors b/model-00162-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bf7ad85e3c1a90a59bc17c51e3f4f36eac850b8c
--- /dev/null
+++ b/model-00162-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9294033ae2c764dc82b3fd84f6b2fa7bc8a46f29005a8a5e5ee81cf08c396a9e
+size 1358954716
diff --git a/model-00163-of-00189.safetensors b/model-00163-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5c738ca6086427bad36b966396bca7b603a03ffe
--- /dev/null
+++ b/model-00163-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:231f9f3a33439451baa655a38b292b76a7d268d48fad5b85203179abad3ba50c
+size 2095203852
diff --git a/model-00164-of-00189.safetensors b/model-00164-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..55db623956e126ec7e9821e31c0719b25e505686
--- /dev/null
+++ b/model-00164-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0bd226d9700755ab2dfc9aef33be200c421b1bdee74148cd9c890ca9a8b2ed0e
+size 1358954716
diff --git a/model-00165-of-00189.safetensors b/model-00165-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..564a55ef210ce3301b67b83a2b2d95db05c5ff73
--- /dev/null
+++ b/model-00165-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a0442e49ffee6c41337d26688cd51b7e1b0c022309dc697ca747ec43e9c31ea0
+size 2095203852
diff --git a/model-00166-of-00189.safetensors b/model-00166-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1f8f2502d84f2309148e91ff670aeac24d9981df
--- /dev/null
+++ b/model-00166-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6c5b345bc1d99c36049c618513a48ced73c688e8794370ddc105c277fdb3241
+size 1358954716
diff --git a/model-00167-of-00189.safetensors b/model-00167-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7e1e00cebacd96234ee219f5dd6580e067eee690
--- /dev/null
+++ b/model-00167-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:274defb697270ac2ba2ceca11890b8476deab085cb35716c72e3b130456f8be9
+size 2095203852
diff --git a/model-00168-of-00189.safetensors b/model-00168-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c5c28afb84a7a3ebb6ad2528dc2148ae69538bc2
--- /dev/null
+++ b/model-00168-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9cf749b42319f0618ecc60bc787c0e6851b117c0273fc31689871b74c9e65573
+size 1358954716
diff --git a/model-00169-of-00189.safetensors b/model-00169-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5581537e090f8048d5119c49fed159e5e3cb7e8a
--- /dev/null
+++ b/model-00169-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:85e584517ba13c65c4a67789da730fa325382a3082d71ca796b9e2408a61bc29
+size 2095203852
diff --git a/model-00170-of-00189.safetensors b/model-00170-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..468837b10fec076a57e26f49afa03122da3c58c7
--- /dev/null
+++ b/model-00170-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:394b0ff02a0da15c87c9fda3c1bce4e121cb46ffcd6fdabc47b529f220155116
+size 1358954716
diff --git a/model-00171-of-00189.safetensors b/model-00171-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e2fe28d99426495b1255cdfe9f92c7334a579b6a
--- /dev/null
+++ b/model-00171-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d07303022df4aaf7c4bdcb1501face4fea88d85fd2efb4f0c360ddcd36644a7
+size 2095203852
diff --git a/model-00172-of-00189.safetensors b/model-00172-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..78b362e99f6efdc1468da6d9f38420b0c72a2be6
--- /dev/null
+++ b/model-00172-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:657fdea905308a7f6e7f84c24ebbfe32cab1958a1a95ed94320f7e529f97c33d
+size 1358954716
diff --git a/model-00173-of-00189.safetensors b/model-00173-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ba9ff604b7263c1954afc0e41bae3c7dfb4f7fe8
--- /dev/null
+++ b/model-00173-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0468e36dcd029aa5777ae5c0e152a713f5b5f8ee659bc11e790e9b28b5f2cbd6
+size 2095203852
diff --git a/model-00174-of-00189.safetensors b/model-00174-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6343b04e5c8283903a10f66e1a206e6a89bae50c
--- /dev/null
+++ b/model-00174-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05017e675c912129a7d148f5d3f4f8b1d313059149697ff2afb6d67f77ed4fc6
+size 1358954716
diff --git a/model-00175-of-00189.safetensors b/model-00175-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0adc080861cef2244247bbb455ecdbd2d8875b16
--- /dev/null
+++ b/model-00175-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:93828889d78b396e5ee1c894923ed80ec04f6b1e18fafe2a51374b52f71b641e
+size 2095203852
diff --git a/model-00176-of-00189.safetensors b/model-00176-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..17554fdee6adaeeff97f681137c330049faee1cb
--- /dev/null
+++ b/model-00176-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:326ed07f1ff016f2b59b6fae10b42c21512319089565cc18d666910579812277
+size 1358954716
diff --git a/model-00177-of-00189.safetensors b/model-00177-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7c474db4c28a7219bd964d6960ff23c9245eb463
--- /dev/null
+++ b/model-00177-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:97d8146466345068c1c8123d7dd47b51b50ac947a263b36617eba104ee54b87f
+size 2095203852
diff --git a/model-00178-of-00189.safetensors b/model-00178-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..62b29677b9c31b5d1766920fa8edb673ea2b4e19
--- /dev/null
+++ b/model-00178-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6ec4a589402861cf36f9232515be5f6438d301b31f447f309bda4a39c3b1e21
+size 1358954716
diff --git a/model-00179-of-00189.safetensors b/model-00179-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..da5540b1cd2873f08d557d526e05573c9a6a1684
--- /dev/null
+++ b/model-00179-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:db4837c92c2e14fca53af9ef1899cd80018b881479d1feb59579c5fe5c214265
+size 2095203852
diff --git a/model-00180-of-00189.safetensors b/model-00180-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8ae64caf68d3d289aa03470a313995c4cf5e7acf
--- /dev/null
+++ b/model-00180-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:358fe0eaabcbf0a317c0bd6dfaf6bfa6ec5906245f70c591a460d9c36fe60ddf
+size 1358954716
diff --git a/model-00181-of-00189.safetensors b/model-00181-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..70abc80ad6cfddadac601ead1491d0fcf88ecdaf
--- /dev/null
+++ b/model-00181-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e66afe00082018645790fc6d4d936ffd057f28015f42059098fa2a954b5b6cfe
+size 2095203852
diff --git a/model-00182-of-00189.safetensors b/model-00182-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8f0df1949fba7f133e134955294aea3041987e88
--- /dev/null
+++ b/model-00182-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c14945c9ab8424598cd487fc8138d4b82b4988ce3b4a1cff11600d746dd7549
+size 1358954716
diff --git a/model-00183-of-00189.safetensors b/model-00183-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..dcef34227d0246ca2e945379f98d6ff0fdc3a35f
--- /dev/null
+++ b/model-00183-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c110b104051e3de30bc6f546525c149dc1b4c8ec494d4266c59fdc3f7bde3c9
+size 2095203852
diff --git a/model-00184-of-00189.safetensors b/model-00184-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4962b18b792ceea7e6092595eec35d41ac98fa95
--- /dev/null
+++ b/model-00184-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d2b525fc7e1ad374a76ba131fa49e1e3e6e7f4f3e026e5c53628f2c24fb4a90
+size 1358954716
diff --git a/model-00185-of-00189.safetensors b/model-00185-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d048ad186bf4e0be90b49d1e168c378e9ac4a086
--- /dev/null
+++ b/model-00185-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3347154a665d1cd5fdb5868c8081fffb7ef9a80f804e8af7c411fa8af810bdb
+size 2095203852
diff --git a/model-00186-of-00189.safetensors b/model-00186-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..81c06f451740d53bcf158f0eb74ef5ddf6342172
--- /dev/null
+++ b/model-00186-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f16d9e7d7e9b06f195d4d376dfed07ab34fe2be1c2a9fb467bebcfba4d64044
+size 1358954716
diff --git a/model-00187-of-00189.safetensors b/model-00187-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7364a8f3b76aa2ccaf9c6691fbfb6e5794df1421
--- /dev/null
+++ b/model-00187-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dce84491f7fe952231ef7c6861d51c6b38de3c204c43eb5cde292d383c4c93c0
+size 3567406348
diff --git a/model-00188-of-00189.safetensors b/model-00188-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cbd09f1006fb584359291cdf98cc1634f7e853ab
--- /dev/null
+++ b/model-00188-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67567822a1e0c2568feb5fc5510b95ef177edb07e067207dfa7770d6f93c51e4
+size 9437184096
diff --git a/model-00189-of-00189.safetensors b/model-00189-of-00189.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..71f17c75d17e6d9fde425f111c235ed41d3438d1
--- /dev/null
+++ b/model-00189-of-00189.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bdaca1e77f53620096e54987f35365a95c2bc760d775488c2a6a4f7b63d8be2f
+size 8154245840
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000000000000000000000000000000000000..945660c1da523300d1142967dfc94e25c12c9868
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1,1547 @@
+{
+ "metadata": {
+ "total_size": 350473664368
+ },
+ "weight_map": {
+ "lm_head.weight": "model-00188-of-00189.safetensors",
+ "model.embed_tokens.weight": "model-00001-of-00189.safetensors",
+ "model.layers.0.input_layernorm.bias": "model-00003-of-00189.safetensors",
+ "model.layers.0.input_layernorm.weight": "model-00003-of-00189.safetensors",
+ "model.layers.0.mlp.down_proj.weight": "model-00003-of-00189.safetensors",
+ "model.layers.0.mlp.down_proj.weight_scale": "model-00003-of-00189.safetensors",
+ "model.layers.0.mlp.up_proj.weight": "model-00002-of-00189.safetensors",
+ "model.layers.0.mlp.up_proj.weight_scale": "model-00002-of-00189.safetensors",
+ "model.layers.0.post_attention_layernorm.bias": "model-00003-of-00189.safetensors",
+ "model.layers.0.post_attention_layernorm.weight": "model-00003-of-00189.safetensors",
+ "model.layers.0.self_attn.k_proj.weight": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.k_proj.weight_scale": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.o_proj.weight": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.o_proj.weight_scale": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.q_proj.weight": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.q_proj.weight_scale": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.v_proj.weight": "model-00002-of-00189.safetensors",
+ "model.layers.0.self_attn.v_proj.weight_scale": "model-00002-of-00189.safetensors",
+ "model.layers.1.input_layernorm.bias": "model-00005-of-00189.safetensors",
+ "model.layers.1.input_layernorm.weight": "model-00005-of-00189.safetensors",
+ "model.layers.1.mlp.down_proj.weight": "model-00005-of-00189.safetensors",
+ "model.layers.1.mlp.down_proj.weight_scale": "model-00005-of-00189.safetensors",
+ "model.layers.1.mlp.up_proj.weight": "model-00004-of-00189.safetensors",
+ "model.layers.1.mlp.up_proj.weight_scale": "model-00004-of-00189.safetensors",
+ "model.layers.1.post_attention_layernorm.bias": "model-00005-of-00189.safetensors",
+ "model.layers.1.post_attention_layernorm.weight": "model-00005-of-00189.safetensors",
+ "model.layers.1.self_attn.k_proj.weight": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.k_proj.weight_scale": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.o_proj.weight": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.o_proj.weight_scale": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.q_proj.weight": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.q_proj.weight_scale": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.v_proj.weight": "model-00003-of-00189.safetensors",
+ "model.layers.1.self_attn.v_proj.weight_scale": "model-00003-of-00189.safetensors",
+ "model.layers.10.input_layernorm.bias": "model-00023-of-00189.safetensors",
+ "model.layers.10.input_layernorm.weight": "model-00023-of-00189.safetensors",
+ "model.layers.10.mlp.down_proj.weight": "model-00023-of-00189.safetensors",
+ "model.layers.10.mlp.down_proj.weight_scale": "model-00023-of-00189.safetensors",
+ "model.layers.10.mlp.up_proj.weight": "model-00022-of-00189.safetensors",
+ "model.layers.10.mlp.up_proj.weight_scale": "model-00022-of-00189.safetensors",
+ "model.layers.10.post_attention_layernorm.bias": "model-00023-of-00189.safetensors",
+ "model.layers.10.post_attention_layernorm.weight": "model-00023-of-00189.safetensors",
+ "model.layers.10.self_attn.k_proj.weight": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.k_proj.weight_scale": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.o_proj.weight": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.o_proj.weight_scale": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.q_proj.weight": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.q_proj.weight_scale": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.v_proj.weight": "model-00021-of-00189.safetensors",
+ "model.layers.10.self_attn.v_proj.weight_scale": "model-00021-of-00189.safetensors",
+ "model.layers.11.input_layernorm.bias": "model-00025-of-00189.safetensors",
+ "model.layers.11.input_layernorm.weight": "model-00025-of-00189.safetensors",
+ "model.layers.11.mlp.down_proj.weight": "model-00025-of-00189.safetensors",
+ "model.layers.11.mlp.down_proj.weight_scale": "model-00025-of-00189.safetensors",
+ "model.layers.11.mlp.up_proj.weight": "model-00024-of-00189.safetensors",
+ "model.layers.11.mlp.up_proj.weight_scale": "model-00024-of-00189.safetensors",
+ "model.layers.11.post_attention_layernorm.bias": "model-00025-of-00189.safetensors",
+ "model.layers.11.post_attention_layernorm.weight": "model-00025-of-00189.safetensors",
+ "model.layers.11.self_attn.k_proj.weight": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.k_proj.weight_scale": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.o_proj.weight": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.o_proj.weight_scale": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.q_proj.weight": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.q_proj.weight_scale": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.v_proj.weight": "model-00023-of-00189.safetensors",
+ "model.layers.11.self_attn.v_proj.weight_scale": "model-00023-of-00189.safetensors",
+ "model.layers.12.input_layernorm.bias": "model-00027-of-00189.safetensors",
+ "model.layers.12.input_layernorm.weight": "model-00027-of-00189.safetensors",
+ "model.layers.12.mlp.down_proj.weight": "model-00027-of-00189.safetensors",
+ "model.layers.12.mlp.down_proj.weight_scale": "model-00027-of-00189.safetensors",
+ "model.layers.12.mlp.up_proj.weight": "model-00026-of-00189.safetensors",
+ "model.layers.12.mlp.up_proj.weight_scale": "model-00026-of-00189.safetensors",
+ "model.layers.12.post_attention_layernorm.bias": "model-00027-of-00189.safetensors",
+ "model.layers.12.post_attention_layernorm.weight": "model-00027-of-00189.safetensors",
+ "model.layers.12.self_attn.k_proj.weight": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.k_proj.weight_scale": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.o_proj.weight": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.o_proj.weight_scale": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.q_proj.weight": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.q_proj.weight_scale": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.v_proj.weight": "model-00025-of-00189.safetensors",
+ "model.layers.12.self_attn.v_proj.weight_scale": "model-00025-of-00189.safetensors",
+ "model.layers.13.input_layernorm.bias": "model-00029-of-00189.safetensors",
+ "model.layers.13.input_layernorm.weight": "model-00029-of-00189.safetensors",
+ "model.layers.13.mlp.down_proj.weight": "model-00029-of-00189.safetensors",
+ "model.layers.13.mlp.down_proj.weight_scale": "model-00029-of-00189.safetensors",
+ "model.layers.13.mlp.up_proj.weight": "model-00028-of-00189.safetensors",
+ "model.layers.13.mlp.up_proj.weight_scale": "model-00028-of-00189.safetensors",
+ "model.layers.13.post_attention_layernorm.bias": "model-00029-of-00189.safetensors",
+ "model.layers.13.post_attention_layernorm.weight": "model-00029-of-00189.safetensors",
+ "model.layers.13.self_attn.k_proj.weight": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.k_proj.weight_scale": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.o_proj.weight": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.o_proj.weight_scale": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.q_proj.weight": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.q_proj.weight_scale": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.v_proj.weight": "model-00027-of-00189.safetensors",
+ "model.layers.13.self_attn.v_proj.weight_scale": "model-00027-of-00189.safetensors",
+ "model.layers.14.input_layernorm.bias": "model-00031-of-00189.safetensors",
+ "model.layers.14.input_layernorm.weight": "model-00031-of-00189.safetensors",
+ "model.layers.14.mlp.down_proj.weight": "model-00031-of-00189.safetensors",
+ "model.layers.14.mlp.down_proj.weight_scale": "model-00031-of-00189.safetensors",
+ "model.layers.14.mlp.up_proj.weight": "model-00030-of-00189.safetensors",
+ "model.layers.14.mlp.up_proj.weight_scale": "model-00030-of-00189.safetensors",
+ "model.layers.14.post_attention_layernorm.bias": "model-00031-of-00189.safetensors",
+ "model.layers.14.post_attention_layernorm.weight": "model-00031-of-00189.safetensors",
+ "model.layers.14.self_attn.k_proj.weight": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.k_proj.weight_scale": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.o_proj.weight": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.o_proj.weight_scale": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.q_proj.weight": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.q_proj.weight_scale": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.v_proj.weight": "model-00029-of-00189.safetensors",
+ "model.layers.14.self_attn.v_proj.weight_scale": "model-00029-of-00189.safetensors",
+ "model.layers.15.input_layernorm.bias": "model-00033-of-00189.safetensors",
+ "model.layers.15.input_layernorm.weight": "model-00033-of-00189.safetensors",
+ "model.layers.15.mlp.down_proj.weight": "model-00033-of-00189.safetensors",
+ "model.layers.15.mlp.down_proj.weight_scale": "model-00033-of-00189.safetensors",
+ "model.layers.15.mlp.up_proj.weight": "model-00032-of-00189.safetensors",
+ "model.layers.15.mlp.up_proj.weight_scale": "model-00032-of-00189.safetensors",
+ "model.layers.15.post_attention_layernorm.bias": "model-00033-of-00189.safetensors",
+ "model.layers.15.post_attention_layernorm.weight": "model-00033-of-00189.safetensors",
+ "model.layers.15.self_attn.k_proj.weight": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.k_proj.weight_scale": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.o_proj.weight": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.o_proj.weight_scale": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.q_proj.weight": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.q_proj.weight_scale": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.v_proj.weight": "model-00031-of-00189.safetensors",
+ "model.layers.15.self_attn.v_proj.weight_scale": "model-00031-of-00189.safetensors",
+ "model.layers.16.input_layernorm.bias": "model-00035-of-00189.safetensors",
+ "model.layers.16.input_layernorm.weight": "model-00035-of-00189.safetensors",
+ "model.layers.16.mlp.down_proj.weight": "model-00035-of-00189.safetensors",
+ "model.layers.16.mlp.down_proj.weight_scale": "model-00035-of-00189.safetensors",
+ "model.layers.16.mlp.up_proj.weight": "model-00034-of-00189.safetensors",
+ "model.layers.16.mlp.up_proj.weight_scale": "model-00034-of-00189.safetensors",
+ "model.layers.16.post_attention_layernorm.bias": "model-00035-of-00189.safetensors",
+ "model.layers.16.post_attention_layernorm.weight": "model-00035-of-00189.safetensors",
+ "model.layers.16.self_attn.k_proj.weight": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.k_proj.weight_scale": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.o_proj.weight": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.o_proj.weight_scale": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.q_proj.weight": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.q_proj.weight_scale": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.v_proj.weight": "model-00033-of-00189.safetensors",
+ "model.layers.16.self_attn.v_proj.weight_scale": "model-00033-of-00189.safetensors",
+ "model.layers.17.input_layernorm.bias": "model-00037-of-00189.safetensors",
+ "model.layers.17.input_layernorm.weight": "model-00037-of-00189.safetensors",
+ "model.layers.17.mlp.down_proj.weight": "model-00037-of-00189.safetensors",
+ "model.layers.17.mlp.down_proj.weight_scale": "model-00037-of-00189.safetensors",
+ "model.layers.17.mlp.up_proj.weight": "model-00036-of-00189.safetensors",
+ "model.layers.17.mlp.up_proj.weight_scale": "model-00036-of-00189.safetensors",
+ "model.layers.17.post_attention_layernorm.bias": "model-00037-of-00189.safetensors",
+ "model.layers.17.post_attention_layernorm.weight": "model-00037-of-00189.safetensors",
+ "model.layers.17.self_attn.k_proj.weight": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.k_proj.weight_scale": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.o_proj.weight": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.o_proj.weight_scale": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.q_proj.weight": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.q_proj.weight_scale": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.v_proj.weight": "model-00035-of-00189.safetensors",
+ "model.layers.17.self_attn.v_proj.weight_scale": "model-00035-of-00189.safetensors",
+ "model.layers.18.input_layernorm.bias": "model-00039-of-00189.safetensors",
+ "model.layers.18.input_layernorm.weight": "model-00039-of-00189.safetensors",
+ "model.layers.18.mlp.down_proj.weight": "model-00039-of-00189.safetensors",
+ "model.layers.18.mlp.down_proj.weight_scale": "model-00039-of-00189.safetensors",
+ "model.layers.18.mlp.up_proj.weight": "model-00038-of-00189.safetensors",
+ "model.layers.18.mlp.up_proj.weight_scale": "model-00038-of-00189.safetensors",
+ "model.layers.18.post_attention_layernorm.bias": "model-00039-of-00189.safetensors",
+ "model.layers.18.post_attention_layernorm.weight": "model-00039-of-00189.safetensors",
+ "model.layers.18.self_attn.k_proj.weight": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.k_proj.weight_scale": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.o_proj.weight": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.o_proj.weight_scale": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.q_proj.weight": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.q_proj.weight_scale": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.v_proj.weight": "model-00037-of-00189.safetensors",
+ "model.layers.18.self_attn.v_proj.weight_scale": "model-00037-of-00189.safetensors",
+ "model.layers.19.input_layernorm.bias": "model-00041-of-00189.safetensors",
+ "model.layers.19.input_layernorm.weight": "model-00041-of-00189.safetensors",
+ "model.layers.19.mlp.down_proj.weight": "model-00041-of-00189.safetensors",
+ "model.layers.19.mlp.down_proj.weight_scale": "model-00041-of-00189.safetensors",
+ "model.layers.19.mlp.up_proj.weight": "model-00040-of-00189.safetensors",
+ "model.layers.19.mlp.up_proj.weight_scale": "model-00040-of-00189.safetensors",
+ "model.layers.19.post_attention_layernorm.bias": "model-00041-of-00189.safetensors",
+ "model.layers.19.post_attention_layernorm.weight": "model-00041-of-00189.safetensors",
+ "model.layers.19.self_attn.k_proj.weight": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.k_proj.weight_scale": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.o_proj.weight": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.o_proj.weight_scale": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.q_proj.weight": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.q_proj.weight_scale": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.v_proj.weight": "model-00039-of-00189.safetensors",
+ "model.layers.19.self_attn.v_proj.weight_scale": "model-00039-of-00189.safetensors",
+ "model.layers.2.input_layernorm.bias": "model-00007-of-00189.safetensors",
+ "model.layers.2.input_layernorm.weight": "model-00007-of-00189.safetensors",
+ "model.layers.2.mlp.down_proj.weight": "model-00007-of-00189.safetensors",
+ "model.layers.2.mlp.down_proj.weight_scale": "model-00007-of-00189.safetensors",
+ "model.layers.2.mlp.up_proj.weight": "model-00006-of-00189.safetensors",
+ "model.layers.2.mlp.up_proj.weight_scale": "model-00006-of-00189.safetensors",
+ "model.layers.2.post_attention_layernorm.bias": "model-00007-of-00189.safetensors",
+ "model.layers.2.post_attention_layernorm.weight": "model-00007-of-00189.safetensors",
+ "model.layers.2.self_attn.k_proj.weight": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.k_proj.weight_scale": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.o_proj.weight": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.o_proj.weight_scale": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.q_proj.weight": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.q_proj.weight_scale": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.v_proj.weight": "model-00005-of-00189.safetensors",
+ "model.layers.2.self_attn.v_proj.weight_scale": "model-00005-of-00189.safetensors",
+ "model.layers.20.input_layernorm.bias": "model-00043-of-00189.safetensors",
+ "model.layers.20.input_layernorm.weight": "model-00043-of-00189.safetensors",
+ "model.layers.20.mlp.down_proj.weight": "model-00043-of-00189.safetensors",
+ "model.layers.20.mlp.down_proj.weight_scale": "model-00043-of-00189.safetensors",
+ "model.layers.20.mlp.up_proj.weight": "model-00042-of-00189.safetensors",
+ "model.layers.20.mlp.up_proj.weight_scale": "model-00042-of-00189.safetensors",
+ "model.layers.20.post_attention_layernorm.bias": "model-00043-of-00189.safetensors",
+ "model.layers.20.post_attention_layernorm.weight": "model-00043-of-00189.safetensors",
+ "model.layers.20.self_attn.k_proj.weight": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.k_proj.weight_scale": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.o_proj.weight": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.o_proj.weight_scale": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.q_proj.weight": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.q_proj.weight_scale": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.v_proj.weight": "model-00041-of-00189.safetensors",
+ "model.layers.20.self_attn.v_proj.weight_scale": "model-00041-of-00189.safetensors",
+ "model.layers.21.input_layernorm.bias": "model-00045-of-00189.safetensors",
+ "model.layers.21.input_layernorm.weight": "model-00045-of-00189.safetensors",
+ "model.layers.21.mlp.down_proj.weight": "model-00045-of-00189.safetensors",
+ "model.layers.21.mlp.down_proj.weight_scale": "model-00045-of-00189.safetensors",
+ "model.layers.21.mlp.up_proj.weight": "model-00044-of-00189.safetensors",
+ "model.layers.21.mlp.up_proj.weight_scale": "model-00044-of-00189.safetensors",
+ "model.layers.21.post_attention_layernorm.bias": "model-00045-of-00189.safetensors",
+ "model.layers.21.post_attention_layernorm.weight": "model-00045-of-00189.safetensors",
+ "model.layers.21.self_attn.k_proj.weight": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.k_proj.weight_scale": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.o_proj.weight": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.o_proj.weight_scale": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.q_proj.weight": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.q_proj.weight_scale": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.v_proj.weight": "model-00043-of-00189.safetensors",
+ "model.layers.21.self_attn.v_proj.weight_scale": "model-00043-of-00189.safetensors",
+ "model.layers.22.input_layernorm.bias": "model-00047-of-00189.safetensors",
+ "model.layers.22.input_layernorm.weight": "model-00047-of-00189.safetensors",
+ "model.layers.22.mlp.down_proj.weight": "model-00047-of-00189.safetensors",
+ "model.layers.22.mlp.down_proj.weight_scale": "model-00047-of-00189.safetensors",
+ "model.layers.22.mlp.up_proj.weight": "model-00046-of-00189.safetensors",
+ "model.layers.22.mlp.up_proj.weight_scale": "model-00046-of-00189.safetensors",
+ "model.layers.22.post_attention_layernorm.bias": "model-00047-of-00189.safetensors",
+ "model.layers.22.post_attention_layernorm.weight": "model-00047-of-00189.safetensors",
+ "model.layers.22.self_attn.k_proj.weight": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.k_proj.weight_scale": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.o_proj.weight": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.o_proj.weight_scale": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.q_proj.weight": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.q_proj.weight_scale": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.v_proj.weight": "model-00045-of-00189.safetensors",
+ "model.layers.22.self_attn.v_proj.weight_scale": "model-00045-of-00189.safetensors",
+ "model.layers.23.input_layernorm.bias": "model-00049-of-00189.safetensors",
+ "model.layers.23.input_layernorm.weight": "model-00049-of-00189.safetensors",
+ "model.layers.23.mlp.down_proj.weight": "model-00049-of-00189.safetensors",
+ "model.layers.23.mlp.down_proj.weight_scale": "model-00049-of-00189.safetensors",
+ "model.layers.23.mlp.up_proj.weight": "model-00048-of-00189.safetensors",
+ "model.layers.23.mlp.up_proj.weight_scale": "model-00048-of-00189.safetensors",
+ "model.layers.23.post_attention_layernorm.bias": "model-00049-of-00189.safetensors",
+ "model.layers.23.post_attention_layernorm.weight": "model-00049-of-00189.safetensors",
+ "model.layers.23.self_attn.k_proj.weight": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.k_proj.weight_scale": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.o_proj.weight": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.o_proj.weight_scale": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.q_proj.weight": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.q_proj.weight_scale": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.v_proj.weight": "model-00047-of-00189.safetensors",
+ "model.layers.23.self_attn.v_proj.weight_scale": "model-00047-of-00189.safetensors",
+ "model.layers.24.input_layernorm.bias": "model-00051-of-00189.safetensors",
+ "model.layers.24.input_layernorm.weight": "model-00051-of-00189.safetensors",
+ "model.layers.24.mlp.down_proj.weight": "model-00051-of-00189.safetensors",
+ "model.layers.24.mlp.down_proj.weight_scale": "model-00051-of-00189.safetensors",
+ "model.layers.24.mlp.up_proj.weight": "model-00050-of-00189.safetensors",
+ "model.layers.24.mlp.up_proj.weight_scale": "model-00050-of-00189.safetensors",
+ "model.layers.24.post_attention_layernorm.bias": "model-00051-of-00189.safetensors",
+ "model.layers.24.post_attention_layernorm.weight": "model-00051-of-00189.safetensors",
+ "model.layers.24.self_attn.k_proj.weight": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.k_proj.weight_scale": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.o_proj.weight": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.o_proj.weight_scale": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.q_proj.weight": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.q_proj.weight_scale": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.v_proj.weight": "model-00049-of-00189.safetensors",
+ "model.layers.24.self_attn.v_proj.weight_scale": "model-00049-of-00189.safetensors",
+ "model.layers.25.input_layernorm.bias": "model-00053-of-00189.safetensors",
+ "model.layers.25.input_layernorm.weight": "model-00053-of-00189.safetensors",
+ "model.layers.25.mlp.down_proj.weight": "model-00053-of-00189.safetensors",
+ "model.layers.25.mlp.down_proj.weight_scale": "model-00053-of-00189.safetensors",
+ "model.layers.25.mlp.up_proj.weight": "model-00052-of-00189.safetensors",
+ "model.layers.25.mlp.up_proj.weight_scale": "model-00052-of-00189.safetensors",
+ "model.layers.25.post_attention_layernorm.bias": "model-00053-of-00189.safetensors",
+ "model.layers.25.post_attention_layernorm.weight": "model-00053-of-00189.safetensors",
+ "model.layers.25.self_attn.k_proj.weight": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.k_proj.weight_scale": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.o_proj.weight": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.o_proj.weight_scale": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.q_proj.weight": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.q_proj.weight_scale": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.v_proj.weight": "model-00051-of-00189.safetensors",
+ "model.layers.25.self_attn.v_proj.weight_scale": "model-00051-of-00189.safetensors",
+ "model.layers.26.input_layernorm.bias": "model-00055-of-00189.safetensors",
+ "model.layers.26.input_layernorm.weight": "model-00055-of-00189.safetensors",
+ "model.layers.26.mlp.down_proj.weight": "model-00055-of-00189.safetensors",
+ "model.layers.26.mlp.down_proj.weight_scale": "model-00055-of-00189.safetensors",
+ "model.layers.26.mlp.up_proj.weight": "model-00054-of-00189.safetensors",
+ "model.layers.26.mlp.up_proj.weight_scale": "model-00054-of-00189.safetensors",
+ "model.layers.26.post_attention_layernorm.bias": "model-00055-of-00189.safetensors",
+ "model.layers.26.post_attention_layernorm.weight": "model-00055-of-00189.safetensors",
+ "model.layers.26.self_attn.k_proj.weight": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.k_proj.weight_scale": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.o_proj.weight": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.o_proj.weight_scale": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.q_proj.weight": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.q_proj.weight_scale": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.v_proj.weight": "model-00053-of-00189.safetensors",
+ "model.layers.26.self_attn.v_proj.weight_scale": "model-00053-of-00189.safetensors",
+ "model.layers.27.input_layernorm.bias": "model-00057-of-00189.safetensors",
+ "model.layers.27.input_layernorm.weight": "model-00057-of-00189.safetensors",
+ "model.layers.27.mlp.down_proj.weight": "model-00057-of-00189.safetensors",
+ "model.layers.27.mlp.down_proj.weight_scale": "model-00057-of-00189.safetensors",
+ "model.layers.27.mlp.up_proj.weight": "model-00056-of-00189.safetensors",
+ "model.layers.27.mlp.up_proj.weight_scale": "model-00056-of-00189.safetensors",
+ "model.layers.27.post_attention_layernorm.bias": "model-00057-of-00189.safetensors",
+ "model.layers.27.post_attention_layernorm.weight": "model-00057-of-00189.safetensors",
+ "model.layers.27.self_attn.k_proj.weight": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.k_proj.weight_scale": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.o_proj.weight": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.o_proj.weight_scale": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.q_proj.weight": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.q_proj.weight_scale": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.v_proj.weight": "model-00055-of-00189.safetensors",
+ "model.layers.27.self_attn.v_proj.weight_scale": "model-00055-of-00189.safetensors",
+ "model.layers.28.input_layernorm.bias": "model-00059-of-00189.safetensors",
+ "model.layers.28.input_layernorm.weight": "model-00059-of-00189.safetensors",
+ "model.layers.28.mlp.down_proj.weight": "model-00059-of-00189.safetensors",
+ "model.layers.28.mlp.down_proj.weight_scale": "model-00059-of-00189.safetensors",
+ "model.layers.28.mlp.up_proj.weight": "model-00058-of-00189.safetensors",
+ "model.layers.28.mlp.up_proj.weight_scale": "model-00058-of-00189.safetensors",
+ "model.layers.28.post_attention_layernorm.bias": "model-00059-of-00189.safetensors",
+ "model.layers.28.post_attention_layernorm.weight": "model-00059-of-00189.safetensors",
+ "model.layers.28.self_attn.k_proj.weight": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.k_proj.weight_scale": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.o_proj.weight": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.o_proj.weight_scale": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.q_proj.weight": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.q_proj.weight_scale": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.v_proj.weight": "model-00057-of-00189.safetensors",
+ "model.layers.28.self_attn.v_proj.weight_scale": "model-00057-of-00189.safetensors",
+ "model.layers.29.input_layernorm.bias": "model-00061-of-00189.safetensors",
+ "model.layers.29.input_layernorm.weight": "model-00061-of-00189.safetensors",
+ "model.layers.29.mlp.down_proj.weight": "model-00061-of-00189.safetensors",
+ "model.layers.29.mlp.down_proj.weight_scale": "model-00061-of-00189.safetensors",
+ "model.layers.29.mlp.up_proj.weight": "model-00060-of-00189.safetensors",
+ "model.layers.29.mlp.up_proj.weight_scale": "model-00060-of-00189.safetensors",
+ "model.layers.29.post_attention_layernorm.bias": "model-00061-of-00189.safetensors",
+ "model.layers.29.post_attention_layernorm.weight": "model-00061-of-00189.safetensors",
+ "model.layers.29.self_attn.k_proj.weight": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.k_proj.weight_scale": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.o_proj.weight": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.o_proj.weight_scale": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.q_proj.weight": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.q_proj.weight_scale": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.v_proj.weight": "model-00059-of-00189.safetensors",
+ "model.layers.29.self_attn.v_proj.weight_scale": "model-00059-of-00189.safetensors",
+ "model.layers.3.input_layernorm.bias": "model-00009-of-00189.safetensors",
+ "model.layers.3.input_layernorm.weight": "model-00009-of-00189.safetensors",
+ "model.layers.3.mlp.down_proj.weight": "model-00009-of-00189.safetensors",
+ "model.layers.3.mlp.down_proj.weight_scale": "model-00009-of-00189.safetensors",
+ "model.layers.3.mlp.up_proj.weight": "model-00008-of-00189.safetensors",
+ "model.layers.3.mlp.up_proj.weight_scale": "model-00008-of-00189.safetensors",
+ "model.layers.3.post_attention_layernorm.bias": "model-00009-of-00189.safetensors",
+ "model.layers.3.post_attention_layernorm.weight": "model-00009-of-00189.safetensors",
+ "model.layers.3.self_attn.k_proj.weight": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.k_proj.weight_scale": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.o_proj.weight": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.o_proj.weight_scale": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.q_proj.weight": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.q_proj.weight_scale": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.v_proj.weight": "model-00007-of-00189.safetensors",
+ "model.layers.3.self_attn.v_proj.weight_scale": "model-00007-of-00189.safetensors",
+ "model.layers.30.input_layernorm.bias": "model-00063-of-00189.safetensors",
+ "model.layers.30.input_layernorm.weight": "model-00063-of-00189.safetensors",
+ "model.layers.30.mlp.down_proj.weight": "model-00063-of-00189.safetensors",
+ "model.layers.30.mlp.down_proj.weight_scale": "model-00063-of-00189.safetensors",
+ "model.layers.30.mlp.up_proj.weight": "model-00062-of-00189.safetensors",
+ "model.layers.30.mlp.up_proj.weight_scale": "model-00062-of-00189.safetensors",
+ "model.layers.30.post_attention_layernorm.bias": "model-00063-of-00189.safetensors",
+ "model.layers.30.post_attention_layernorm.weight": "model-00063-of-00189.safetensors",
+ "model.layers.30.self_attn.k_proj.weight": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.k_proj.weight_scale": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.o_proj.weight": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.o_proj.weight_scale": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.q_proj.weight": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.q_proj.weight_scale": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.v_proj.weight": "model-00061-of-00189.safetensors",
+ "model.layers.30.self_attn.v_proj.weight_scale": "model-00061-of-00189.safetensors",
+ "model.layers.31.input_layernorm.bias": "model-00065-of-00189.safetensors",
+ "model.layers.31.input_layernorm.weight": "model-00065-of-00189.safetensors",
+ "model.layers.31.mlp.down_proj.weight": "model-00065-of-00189.safetensors",
+ "model.layers.31.mlp.down_proj.weight_scale": "model-00065-of-00189.safetensors",
+ "model.layers.31.mlp.up_proj.weight": "model-00064-of-00189.safetensors",
+ "model.layers.31.mlp.up_proj.weight_scale": "model-00064-of-00189.safetensors",
+ "model.layers.31.post_attention_layernorm.bias": "model-00065-of-00189.safetensors",
+ "model.layers.31.post_attention_layernorm.weight": "model-00065-of-00189.safetensors",
+ "model.layers.31.self_attn.k_proj.weight": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.k_proj.weight_scale": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.o_proj.weight": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.o_proj.weight_scale": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.q_proj.weight": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.q_proj.weight_scale": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.v_proj.weight": "model-00063-of-00189.safetensors",
+ "model.layers.31.self_attn.v_proj.weight_scale": "model-00063-of-00189.safetensors",
+ "model.layers.32.input_layernorm.bias": "model-00067-of-00189.safetensors",
+ "model.layers.32.input_layernorm.weight": "model-00067-of-00189.safetensors",
+ "model.layers.32.mlp.down_proj.weight": "model-00067-of-00189.safetensors",
+ "model.layers.32.mlp.down_proj.weight_scale": "model-00067-of-00189.safetensors",
+ "model.layers.32.mlp.up_proj.weight": "model-00066-of-00189.safetensors",
+ "model.layers.32.mlp.up_proj.weight_scale": "model-00066-of-00189.safetensors",
+ "model.layers.32.post_attention_layernorm.bias": "model-00067-of-00189.safetensors",
+ "model.layers.32.post_attention_layernorm.weight": "model-00067-of-00189.safetensors",
+ "model.layers.32.self_attn.k_proj.weight": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.k_proj.weight_scale": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.o_proj.weight": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.o_proj.weight_scale": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.q_proj.weight": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.q_proj.weight_scale": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.v_proj.weight": "model-00065-of-00189.safetensors",
+ "model.layers.32.self_attn.v_proj.weight_scale": "model-00065-of-00189.safetensors",
+ "model.layers.33.input_layernorm.bias": "model-00069-of-00189.safetensors",
+ "model.layers.33.input_layernorm.weight": "model-00069-of-00189.safetensors",
+ "model.layers.33.mlp.down_proj.weight": "model-00069-of-00189.safetensors",
+ "model.layers.33.mlp.down_proj.weight_scale": "model-00069-of-00189.safetensors",
+ "model.layers.33.mlp.up_proj.weight": "model-00068-of-00189.safetensors",
+ "model.layers.33.mlp.up_proj.weight_scale": "model-00068-of-00189.safetensors",
+ "model.layers.33.post_attention_layernorm.bias": "model-00069-of-00189.safetensors",
+ "model.layers.33.post_attention_layernorm.weight": "model-00069-of-00189.safetensors",
+ "model.layers.33.self_attn.k_proj.weight": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.k_proj.weight_scale": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.o_proj.weight": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.o_proj.weight_scale": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.q_proj.weight": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.q_proj.weight_scale": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.v_proj.weight": "model-00067-of-00189.safetensors",
+ "model.layers.33.self_attn.v_proj.weight_scale": "model-00067-of-00189.safetensors",
+ "model.layers.34.input_layernorm.bias": "model-00071-of-00189.safetensors",
+ "model.layers.34.input_layernorm.weight": "model-00071-of-00189.safetensors",
+ "model.layers.34.mlp.down_proj.weight": "model-00071-of-00189.safetensors",
+ "model.layers.34.mlp.down_proj.weight_scale": "model-00071-of-00189.safetensors",
+ "model.layers.34.mlp.up_proj.weight": "model-00070-of-00189.safetensors",
+ "model.layers.34.mlp.up_proj.weight_scale": "model-00070-of-00189.safetensors",
+ "model.layers.34.post_attention_layernorm.bias": "model-00071-of-00189.safetensors",
+ "model.layers.34.post_attention_layernorm.weight": "model-00071-of-00189.safetensors",
+ "model.layers.34.self_attn.k_proj.weight": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.k_proj.weight_scale": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.o_proj.weight": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.o_proj.weight_scale": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.q_proj.weight": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.q_proj.weight_scale": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.v_proj.weight": "model-00069-of-00189.safetensors",
+ "model.layers.34.self_attn.v_proj.weight_scale": "model-00069-of-00189.safetensors",
+ "model.layers.35.input_layernorm.bias": "model-00073-of-00189.safetensors",
+ "model.layers.35.input_layernorm.weight": "model-00073-of-00189.safetensors",
+ "model.layers.35.mlp.down_proj.weight": "model-00073-of-00189.safetensors",
+ "model.layers.35.mlp.down_proj.weight_scale": "model-00073-of-00189.safetensors",
+ "model.layers.35.mlp.up_proj.weight": "model-00072-of-00189.safetensors",
+ "model.layers.35.mlp.up_proj.weight_scale": "model-00072-of-00189.safetensors",
+ "model.layers.35.post_attention_layernorm.bias": "model-00073-of-00189.safetensors",
+ "model.layers.35.post_attention_layernorm.weight": "model-00073-of-00189.safetensors",
+ "model.layers.35.self_attn.k_proj.weight": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.k_proj.weight_scale": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.o_proj.weight": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.o_proj.weight_scale": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.q_proj.weight": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.q_proj.weight_scale": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.v_proj.weight": "model-00071-of-00189.safetensors",
+ "model.layers.35.self_attn.v_proj.weight_scale": "model-00071-of-00189.safetensors",
+ "model.layers.36.input_layernorm.bias": "model-00075-of-00189.safetensors",
+ "model.layers.36.input_layernorm.weight": "model-00075-of-00189.safetensors",
+ "model.layers.36.mlp.down_proj.weight": "model-00075-of-00189.safetensors",
+ "model.layers.36.mlp.down_proj.weight_scale": "model-00075-of-00189.safetensors",
+ "model.layers.36.mlp.up_proj.weight": "model-00074-of-00189.safetensors",
+ "model.layers.36.mlp.up_proj.weight_scale": "model-00074-of-00189.safetensors",
+ "model.layers.36.post_attention_layernorm.bias": "model-00075-of-00189.safetensors",
+ "model.layers.36.post_attention_layernorm.weight": "model-00075-of-00189.safetensors",
+ "model.layers.36.self_attn.k_proj.weight": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.k_proj.weight_scale": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.o_proj.weight": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.o_proj.weight_scale": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.q_proj.weight": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.q_proj.weight_scale": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.v_proj.weight": "model-00073-of-00189.safetensors",
+ "model.layers.36.self_attn.v_proj.weight_scale": "model-00073-of-00189.safetensors",
+ "model.layers.37.input_layernorm.bias": "model-00077-of-00189.safetensors",
+ "model.layers.37.input_layernorm.weight": "model-00077-of-00189.safetensors",
+ "model.layers.37.mlp.down_proj.weight": "model-00077-of-00189.safetensors",
+ "model.layers.37.mlp.down_proj.weight_scale": "model-00077-of-00189.safetensors",
+ "model.layers.37.mlp.up_proj.weight": "model-00076-of-00189.safetensors",
+ "model.layers.37.mlp.up_proj.weight_scale": "model-00076-of-00189.safetensors",
+ "model.layers.37.post_attention_layernorm.bias": "model-00077-of-00189.safetensors",
+ "model.layers.37.post_attention_layernorm.weight": "model-00077-of-00189.safetensors",
+ "model.layers.37.self_attn.k_proj.weight": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.k_proj.weight_scale": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.o_proj.weight": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.o_proj.weight_scale": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.q_proj.weight": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.q_proj.weight_scale": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.v_proj.weight": "model-00075-of-00189.safetensors",
+ "model.layers.37.self_attn.v_proj.weight_scale": "model-00075-of-00189.safetensors",
+ "model.layers.38.input_layernorm.bias": "model-00079-of-00189.safetensors",
+ "model.layers.38.input_layernorm.weight": "model-00079-of-00189.safetensors",
+ "model.layers.38.mlp.down_proj.weight": "model-00079-of-00189.safetensors",
+ "model.layers.38.mlp.down_proj.weight_scale": "model-00079-of-00189.safetensors",
+ "model.layers.38.mlp.up_proj.weight": "model-00078-of-00189.safetensors",
+ "model.layers.38.mlp.up_proj.weight_scale": "model-00078-of-00189.safetensors",
+ "model.layers.38.post_attention_layernorm.bias": "model-00079-of-00189.safetensors",
+ "model.layers.38.post_attention_layernorm.weight": "model-00079-of-00189.safetensors",
+ "model.layers.38.self_attn.k_proj.weight": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.k_proj.weight_scale": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.o_proj.weight": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.o_proj.weight_scale": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.q_proj.weight": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.q_proj.weight_scale": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.v_proj.weight": "model-00077-of-00189.safetensors",
+ "model.layers.38.self_attn.v_proj.weight_scale": "model-00077-of-00189.safetensors",
+ "model.layers.39.input_layernorm.bias": "model-00081-of-00189.safetensors",
+ "model.layers.39.input_layernorm.weight": "model-00081-of-00189.safetensors",
+ "model.layers.39.mlp.down_proj.weight": "model-00081-of-00189.safetensors",
+ "model.layers.39.mlp.down_proj.weight_scale": "model-00081-of-00189.safetensors",
+ "model.layers.39.mlp.up_proj.weight": "model-00080-of-00189.safetensors",
+ "model.layers.39.mlp.up_proj.weight_scale": "model-00080-of-00189.safetensors",
+ "model.layers.39.post_attention_layernorm.bias": "model-00081-of-00189.safetensors",
+ "model.layers.39.post_attention_layernorm.weight": "model-00081-of-00189.safetensors",
+ "model.layers.39.self_attn.k_proj.weight": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.k_proj.weight_scale": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.o_proj.weight": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.o_proj.weight_scale": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.q_proj.weight": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.q_proj.weight_scale": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.v_proj.weight": "model-00079-of-00189.safetensors",
+ "model.layers.39.self_attn.v_proj.weight_scale": "model-00079-of-00189.safetensors",
+ "model.layers.4.input_layernorm.bias": "model-00011-of-00189.safetensors",
+ "model.layers.4.input_layernorm.weight": "model-00011-of-00189.safetensors",
+ "model.layers.4.mlp.down_proj.weight": "model-00011-of-00189.safetensors",
+ "model.layers.4.mlp.down_proj.weight_scale": "model-00011-of-00189.safetensors",
+ "model.layers.4.mlp.up_proj.weight": "model-00010-of-00189.safetensors",
+ "model.layers.4.mlp.up_proj.weight_scale": "model-00010-of-00189.safetensors",
+ "model.layers.4.post_attention_layernorm.bias": "model-00011-of-00189.safetensors",
+ "model.layers.4.post_attention_layernorm.weight": "model-00011-of-00189.safetensors",
+ "model.layers.4.self_attn.k_proj.weight": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.k_proj.weight_scale": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.o_proj.weight": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.o_proj.weight_scale": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.q_proj.weight": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.q_proj.weight_scale": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.v_proj.weight": "model-00009-of-00189.safetensors",
+ "model.layers.4.self_attn.v_proj.weight_scale": "model-00009-of-00189.safetensors",
+ "model.layers.40.input_layernorm.bias": "model-00083-of-00189.safetensors",
+ "model.layers.40.input_layernorm.weight": "model-00083-of-00189.safetensors",
+ "model.layers.40.mlp.down_proj.weight": "model-00083-of-00189.safetensors",
+ "model.layers.40.mlp.down_proj.weight_scale": "model-00083-of-00189.safetensors",
+ "model.layers.40.mlp.up_proj.weight": "model-00082-of-00189.safetensors",
+ "model.layers.40.mlp.up_proj.weight_scale": "model-00082-of-00189.safetensors",
+ "model.layers.40.post_attention_layernorm.bias": "model-00083-of-00189.safetensors",
+ "model.layers.40.post_attention_layernorm.weight": "model-00083-of-00189.safetensors",
+ "model.layers.40.self_attn.k_proj.weight": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.k_proj.weight_scale": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.o_proj.weight": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.o_proj.weight_scale": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.q_proj.weight": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.q_proj.weight_scale": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.v_proj.weight": "model-00081-of-00189.safetensors",
+ "model.layers.40.self_attn.v_proj.weight_scale": "model-00081-of-00189.safetensors",
+ "model.layers.41.input_layernorm.bias": "model-00085-of-00189.safetensors",
+ "model.layers.41.input_layernorm.weight": "model-00085-of-00189.safetensors",
+ "model.layers.41.mlp.down_proj.weight": "model-00085-of-00189.safetensors",
+ "model.layers.41.mlp.down_proj.weight_scale": "model-00085-of-00189.safetensors",
+ "model.layers.41.mlp.up_proj.weight": "model-00084-of-00189.safetensors",
+ "model.layers.41.mlp.up_proj.weight_scale": "model-00084-of-00189.safetensors",
+ "model.layers.41.post_attention_layernorm.bias": "model-00085-of-00189.safetensors",
+ "model.layers.41.post_attention_layernorm.weight": "model-00085-of-00189.safetensors",
+ "model.layers.41.self_attn.k_proj.weight": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.k_proj.weight_scale": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.o_proj.weight": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.o_proj.weight_scale": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.q_proj.weight": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.q_proj.weight_scale": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.v_proj.weight": "model-00083-of-00189.safetensors",
+ "model.layers.41.self_attn.v_proj.weight_scale": "model-00083-of-00189.safetensors",
+ "model.layers.42.input_layernorm.bias": "model-00087-of-00189.safetensors",
+ "model.layers.42.input_layernorm.weight": "model-00087-of-00189.safetensors",
+ "model.layers.42.mlp.down_proj.weight": "model-00087-of-00189.safetensors",
+ "model.layers.42.mlp.down_proj.weight_scale": "model-00087-of-00189.safetensors",
+ "model.layers.42.mlp.up_proj.weight": "model-00086-of-00189.safetensors",
+ "model.layers.42.mlp.up_proj.weight_scale": "model-00086-of-00189.safetensors",
+ "model.layers.42.post_attention_layernorm.bias": "model-00087-of-00189.safetensors",
+ "model.layers.42.post_attention_layernorm.weight": "model-00087-of-00189.safetensors",
+ "model.layers.42.self_attn.k_proj.weight": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.k_proj.weight_scale": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.o_proj.weight": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.o_proj.weight_scale": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.q_proj.weight": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.q_proj.weight_scale": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.v_proj.weight": "model-00085-of-00189.safetensors",
+ "model.layers.42.self_attn.v_proj.weight_scale": "model-00085-of-00189.safetensors",
+ "model.layers.43.input_layernorm.bias": "model-00089-of-00189.safetensors",
+ "model.layers.43.input_layernorm.weight": "model-00089-of-00189.safetensors",
+ "model.layers.43.mlp.down_proj.weight": "model-00089-of-00189.safetensors",
+ "model.layers.43.mlp.down_proj.weight_scale": "model-00089-of-00189.safetensors",
+ "model.layers.43.mlp.up_proj.weight": "model-00088-of-00189.safetensors",
+ "model.layers.43.mlp.up_proj.weight_scale": "model-00088-of-00189.safetensors",
+ "model.layers.43.post_attention_layernorm.bias": "model-00089-of-00189.safetensors",
+ "model.layers.43.post_attention_layernorm.weight": "model-00089-of-00189.safetensors",
+ "model.layers.43.self_attn.k_proj.weight": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.k_proj.weight_scale": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.o_proj.weight": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.o_proj.weight_scale": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.q_proj.weight": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.q_proj.weight_scale": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.v_proj.weight": "model-00087-of-00189.safetensors",
+ "model.layers.43.self_attn.v_proj.weight_scale": "model-00087-of-00189.safetensors",
+ "model.layers.44.input_layernorm.bias": "model-00091-of-00189.safetensors",
+ "model.layers.44.input_layernorm.weight": "model-00091-of-00189.safetensors",
+ "model.layers.44.mlp.down_proj.weight": "model-00091-of-00189.safetensors",
+ "model.layers.44.mlp.down_proj.weight_scale": "model-00091-of-00189.safetensors",
+ "model.layers.44.mlp.up_proj.weight": "model-00090-of-00189.safetensors",
+ "model.layers.44.mlp.up_proj.weight_scale": "model-00090-of-00189.safetensors",
+ "model.layers.44.post_attention_layernorm.bias": "model-00091-of-00189.safetensors",
+ "model.layers.44.post_attention_layernorm.weight": "model-00091-of-00189.safetensors",
+ "model.layers.44.self_attn.k_proj.weight": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.k_proj.weight_scale": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.o_proj.weight": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.o_proj.weight_scale": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.q_proj.weight": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.q_proj.weight_scale": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.v_proj.weight": "model-00089-of-00189.safetensors",
+ "model.layers.44.self_attn.v_proj.weight_scale": "model-00089-of-00189.safetensors",
+ "model.layers.45.input_layernorm.bias": "model-00093-of-00189.safetensors",
+ "model.layers.45.input_layernorm.weight": "model-00093-of-00189.safetensors",
+ "model.layers.45.mlp.down_proj.weight": "model-00093-of-00189.safetensors",
+ "model.layers.45.mlp.down_proj.weight_scale": "model-00093-of-00189.safetensors",
+ "model.layers.45.mlp.up_proj.weight": "model-00092-of-00189.safetensors",
+ "model.layers.45.mlp.up_proj.weight_scale": "model-00092-of-00189.safetensors",
+ "model.layers.45.post_attention_layernorm.bias": "model-00093-of-00189.safetensors",
+ "model.layers.45.post_attention_layernorm.weight": "model-00093-of-00189.safetensors",
+ "model.layers.45.self_attn.k_proj.weight": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.k_proj.weight_scale": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.o_proj.weight": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.o_proj.weight_scale": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.q_proj.weight": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.q_proj.weight_scale": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.v_proj.weight": "model-00091-of-00189.safetensors",
+ "model.layers.45.self_attn.v_proj.weight_scale": "model-00091-of-00189.safetensors",
+ "model.layers.46.input_layernorm.bias": "model-00095-of-00189.safetensors",
+ "model.layers.46.input_layernorm.weight": "model-00095-of-00189.safetensors",
+ "model.layers.46.mlp.down_proj.weight": "model-00095-of-00189.safetensors",
+ "model.layers.46.mlp.down_proj.weight_scale": "model-00095-of-00189.safetensors",
+ "model.layers.46.mlp.up_proj.weight": "model-00094-of-00189.safetensors",
+ "model.layers.46.mlp.up_proj.weight_scale": "model-00094-of-00189.safetensors",
+ "model.layers.46.post_attention_layernorm.bias": "model-00095-of-00189.safetensors",
+ "model.layers.46.post_attention_layernorm.weight": "model-00095-of-00189.safetensors",
+ "model.layers.46.self_attn.k_proj.weight": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.k_proj.weight_scale": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.o_proj.weight": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.o_proj.weight_scale": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.q_proj.weight": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.q_proj.weight_scale": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.v_proj.weight": "model-00093-of-00189.safetensors",
+ "model.layers.46.self_attn.v_proj.weight_scale": "model-00093-of-00189.safetensors",
+ "model.layers.47.input_layernorm.bias": "model-00097-of-00189.safetensors",
+ "model.layers.47.input_layernorm.weight": "model-00097-of-00189.safetensors",
+ "model.layers.47.mlp.down_proj.weight": "model-00097-of-00189.safetensors",
+ "model.layers.47.mlp.down_proj.weight_scale": "model-00097-of-00189.safetensors",
+ "model.layers.47.mlp.up_proj.weight": "model-00096-of-00189.safetensors",
+ "model.layers.47.mlp.up_proj.weight_scale": "model-00096-of-00189.safetensors",
+ "model.layers.47.post_attention_layernorm.bias": "model-00097-of-00189.safetensors",
+ "model.layers.47.post_attention_layernorm.weight": "model-00097-of-00189.safetensors",
+ "model.layers.47.self_attn.k_proj.weight": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.k_proj.weight_scale": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.o_proj.weight": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.o_proj.weight_scale": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.q_proj.weight": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.q_proj.weight_scale": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.v_proj.weight": "model-00095-of-00189.safetensors",
+ "model.layers.47.self_attn.v_proj.weight_scale": "model-00095-of-00189.safetensors",
+ "model.layers.48.input_layernorm.bias": "model-00099-of-00189.safetensors",
+ "model.layers.48.input_layernorm.weight": "model-00099-of-00189.safetensors",
+ "model.layers.48.mlp.down_proj.weight": "model-00099-of-00189.safetensors",
+ "model.layers.48.mlp.down_proj.weight_scale": "model-00099-of-00189.safetensors",
+ "model.layers.48.mlp.up_proj.weight": "model-00098-of-00189.safetensors",
+ "model.layers.48.mlp.up_proj.weight_scale": "model-00098-of-00189.safetensors",
+ "model.layers.48.post_attention_layernorm.bias": "model-00099-of-00189.safetensors",
+ "model.layers.48.post_attention_layernorm.weight": "model-00099-of-00189.safetensors",
+ "model.layers.48.self_attn.k_proj.weight": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.k_proj.weight_scale": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.o_proj.weight": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.o_proj.weight_scale": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.q_proj.weight": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.q_proj.weight_scale": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.v_proj.weight": "model-00097-of-00189.safetensors",
+ "model.layers.48.self_attn.v_proj.weight_scale": "model-00097-of-00189.safetensors",
+ "model.layers.49.input_layernorm.bias": "model-00101-of-00189.safetensors",
+ "model.layers.49.input_layernorm.weight": "model-00101-of-00189.safetensors",
+ "model.layers.49.mlp.down_proj.weight": "model-00101-of-00189.safetensors",
+ "model.layers.49.mlp.down_proj.weight_scale": "model-00101-of-00189.safetensors",
+ "model.layers.49.mlp.up_proj.weight": "model-00100-of-00189.safetensors",
+ "model.layers.49.mlp.up_proj.weight_scale": "model-00100-of-00189.safetensors",
+ "model.layers.49.post_attention_layernorm.bias": "model-00101-of-00189.safetensors",
+ "model.layers.49.post_attention_layernorm.weight": "model-00101-of-00189.safetensors",
+ "model.layers.49.self_attn.k_proj.weight": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.k_proj.weight_scale": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.o_proj.weight": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.o_proj.weight_scale": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.q_proj.weight": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.q_proj.weight_scale": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.v_proj.weight": "model-00099-of-00189.safetensors",
+ "model.layers.49.self_attn.v_proj.weight_scale": "model-00099-of-00189.safetensors",
+ "model.layers.5.input_layernorm.bias": "model-00013-of-00189.safetensors",
+ "model.layers.5.input_layernorm.weight": "model-00013-of-00189.safetensors",
+ "model.layers.5.mlp.down_proj.weight": "model-00013-of-00189.safetensors",
+ "model.layers.5.mlp.down_proj.weight_scale": "model-00013-of-00189.safetensors",
+ "model.layers.5.mlp.up_proj.weight": "model-00012-of-00189.safetensors",
+ "model.layers.5.mlp.up_proj.weight_scale": "model-00012-of-00189.safetensors",
+ "model.layers.5.post_attention_layernorm.bias": "model-00013-of-00189.safetensors",
+ "model.layers.5.post_attention_layernorm.weight": "model-00013-of-00189.safetensors",
+ "model.layers.5.self_attn.k_proj.weight": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.k_proj.weight_scale": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.o_proj.weight": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.o_proj.weight_scale": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.q_proj.weight": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.q_proj.weight_scale": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.v_proj.weight": "model-00011-of-00189.safetensors",
+ "model.layers.5.self_attn.v_proj.weight_scale": "model-00011-of-00189.safetensors",
+ "model.layers.50.input_layernorm.bias": "model-00103-of-00189.safetensors",
+ "model.layers.50.input_layernorm.weight": "model-00103-of-00189.safetensors",
+ "model.layers.50.mlp.down_proj.weight": "model-00103-of-00189.safetensors",
+ "model.layers.50.mlp.down_proj.weight_scale": "model-00103-of-00189.safetensors",
+ "model.layers.50.mlp.up_proj.weight": "model-00102-of-00189.safetensors",
+ "model.layers.50.mlp.up_proj.weight_scale": "model-00102-of-00189.safetensors",
+ "model.layers.50.post_attention_layernorm.bias": "model-00103-of-00189.safetensors",
+ "model.layers.50.post_attention_layernorm.weight": "model-00103-of-00189.safetensors",
+ "model.layers.50.self_attn.k_proj.weight": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.k_proj.weight_scale": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.o_proj.weight": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.o_proj.weight_scale": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.q_proj.weight": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.q_proj.weight_scale": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.v_proj.weight": "model-00101-of-00189.safetensors",
+ "model.layers.50.self_attn.v_proj.weight_scale": "model-00101-of-00189.safetensors",
+ "model.layers.51.input_layernorm.bias": "model-00105-of-00189.safetensors",
+ "model.layers.51.input_layernorm.weight": "model-00105-of-00189.safetensors",
+ "model.layers.51.mlp.down_proj.weight": "model-00105-of-00189.safetensors",
+ "model.layers.51.mlp.down_proj.weight_scale": "model-00105-of-00189.safetensors",
+ "model.layers.51.mlp.up_proj.weight": "model-00104-of-00189.safetensors",
+ "model.layers.51.mlp.up_proj.weight_scale": "model-00104-of-00189.safetensors",
+ "model.layers.51.post_attention_layernorm.bias": "model-00105-of-00189.safetensors",
+ "model.layers.51.post_attention_layernorm.weight": "model-00105-of-00189.safetensors",
+ "model.layers.51.self_attn.k_proj.weight": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.k_proj.weight_scale": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.o_proj.weight": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.o_proj.weight_scale": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.q_proj.weight": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.q_proj.weight_scale": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.v_proj.weight": "model-00103-of-00189.safetensors",
+ "model.layers.51.self_attn.v_proj.weight_scale": "model-00103-of-00189.safetensors",
+ "model.layers.52.input_layernorm.bias": "model-00107-of-00189.safetensors",
+ "model.layers.52.input_layernorm.weight": "model-00107-of-00189.safetensors",
+ "model.layers.52.mlp.down_proj.weight": "model-00107-of-00189.safetensors",
+ "model.layers.52.mlp.down_proj.weight_scale": "model-00107-of-00189.safetensors",
+ "model.layers.52.mlp.up_proj.weight": "model-00106-of-00189.safetensors",
+ "model.layers.52.mlp.up_proj.weight_scale": "model-00106-of-00189.safetensors",
+ "model.layers.52.post_attention_layernorm.bias": "model-00107-of-00189.safetensors",
+ "model.layers.52.post_attention_layernorm.weight": "model-00107-of-00189.safetensors",
+ "model.layers.52.self_attn.k_proj.weight": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.k_proj.weight_scale": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.o_proj.weight": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.o_proj.weight_scale": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.q_proj.weight": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.q_proj.weight_scale": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.v_proj.weight": "model-00105-of-00189.safetensors",
+ "model.layers.52.self_attn.v_proj.weight_scale": "model-00105-of-00189.safetensors",
+ "model.layers.53.input_layernorm.bias": "model-00109-of-00189.safetensors",
+ "model.layers.53.input_layernorm.weight": "model-00109-of-00189.safetensors",
+ "model.layers.53.mlp.down_proj.weight": "model-00109-of-00189.safetensors",
+ "model.layers.53.mlp.down_proj.weight_scale": "model-00109-of-00189.safetensors",
+ "model.layers.53.mlp.up_proj.weight": "model-00108-of-00189.safetensors",
+ "model.layers.53.mlp.up_proj.weight_scale": "model-00108-of-00189.safetensors",
+ "model.layers.53.post_attention_layernorm.bias": "model-00109-of-00189.safetensors",
+ "model.layers.53.post_attention_layernorm.weight": "model-00109-of-00189.safetensors",
+ "model.layers.53.self_attn.k_proj.weight": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.k_proj.weight_scale": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.o_proj.weight": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.o_proj.weight_scale": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.q_proj.weight": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.q_proj.weight_scale": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.v_proj.weight": "model-00107-of-00189.safetensors",
+ "model.layers.53.self_attn.v_proj.weight_scale": "model-00107-of-00189.safetensors",
+ "model.layers.54.input_layernorm.bias": "model-00111-of-00189.safetensors",
+ "model.layers.54.input_layernorm.weight": "model-00111-of-00189.safetensors",
+ "model.layers.54.mlp.down_proj.weight": "model-00111-of-00189.safetensors",
+ "model.layers.54.mlp.down_proj.weight_scale": "model-00111-of-00189.safetensors",
+ "model.layers.54.mlp.up_proj.weight": "model-00110-of-00189.safetensors",
+ "model.layers.54.mlp.up_proj.weight_scale": "model-00110-of-00189.safetensors",
+ "model.layers.54.post_attention_layernorm.bias": "model-00111-of-00189.safetensors",
+ "model.layers.54.post_attention_layernorm.weight": "model-00111-of-00189.safetensors",
+ "model.layers.54.self_attn.k_proj.weight": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.k_proj.weight_scale": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.o_proj.weight": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.o_proj.weight_scale": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.q_proj.weight": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.q_proj.weight_scale": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.v_proj.weight": "model-00109-of-00189.safetensors",
+ "model.layers.54.self_attn.v_proj.weight_scale": "model-00109-of-00189.safetensors",
+ "model.layers.55.input_layernorm.bias": "model-00113-of-00189.safetensors",
+ "model.layers.55.input_layernorm.weight": "model-00113-of-00189.safetensors",
+ "model.layers.55.mlp.down_proj.weight": "model-00113-of-00189.safetensors",
+ "model.layers.55.mlp.down_proj.weight_scale": "model-00113-of-00189.safetensors",
+ "model.layers.55.mlp.up_proj.weight": "model-00112-of-00189.safetensors",
+ "model.layers.55.mlp.up_proj.weight_scale": "model-00112-of-00189.safetensors",
+ "model.layers.55.post_attention_layernorm.bias": "model-00113-of-00189.safetensors",
+ "model.layers.55.post_attention_layernorm.weight": "model-00113-of-00189.safetensors",
+ "model.layers.55.self_attn.k_proj.weight": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.k_proj.weight_scale": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.o_proj.weight": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.o_proj.weight_scale": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.q_proj.weight": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.q_proj.weight_scale": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.v_proj.weight": "model-00111-of-00189.safetensors",
+ "model.layers.55.self_attn.v_proj.weight_scale": "model-00111-of-00189.safetensors",
+ "model.layers.56.input_layernorm.bias": "model-00115-of-00189.safetensors",
+ "model.layers.56.input_layernorm.weight": "model-00115-of-00189.safetensors",
+ "model.layers.56.mlp.down_proj.weight": "model-00115-of-00189.safetensors",
+ "model.layers.56.mlp.down_proj.weight_scale": "model-00115-of-00189.safetensors",
+ "model.layers.56.mlp.up_proj.weight": "model-00114-of-00189.safetensors",
+ "model.layers.56.mlp.up_proj.weight_scale": "model-00114-of-00189.safetensors",
+ "model.layers.56.post_attention_layernorm.bias": "model-00115-of-00189.safetensors",
+ "model.layers.56.post_attention_layernorm.weight": "model-00115-of-00189.safetensors",
+ "model.layers.56.self_attn.k_proj.weight": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.k_proj.weight_scale": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.o_proj.weight": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.o_proj.weight_scale": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.q_proj.weight": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.q_proj.weight_scale": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.v_proj.weight": "model-00113-of-00189.safetensors",
+ "model.layers.56.self_attn.v_proj.weight_scale": "model-00113-of-00189.safetensors",
+ "model.layers.57.input_layernorm.bias": "model-00117-of-00189.safetensors",
+ "model.layers.57.input_layernorm.weight": "model-00117-of-00189.safetensors",
+ "model.layers.57.mlp.down_proj.weight": "model-00117-of-00189.safetensors",
+ "model.layers.57.mlp.down_proj.weight_scale": "model-00117-of-00189.safetensors",
+ "model.layers.57.mlp.up_proj.weight": "model-00116-of-00189.safetensors",
+ "model.layers.57.mlp.up_proj.weight_scale": "model-00116-of-00189.safetensors",
+ "model.layers.57.post_attention_layernorm.bias": "model-00117-of-00189.safetensors",
+ "model.layers.57.post_attention_layernorm.weight": "model-00117-of-00189.safetensors",
+ "model.layers.57.self_attn.k_proj.weight": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.k_proj.weight_scale": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.o_proj.weight": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.o_proj.weight_scale": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.q_proj.weight": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.q_proj.weight_scale": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.v_proj.weight": "model-00115-of-00189.safetensors",
+ "model.layers.57.self_attn.v_proj.weight_scale": "model-00115-of-00189.safetensors",
+ "model.layers.58.input_layernorm.bias": "model-00119-of-00189.safetensors",
+ "model.layers.58.input_layernorm.weight": "model-00119-of-00189.safetensors",
+ "model.layers.58.mlp.down_proj.weight": "model-00119-of-00189.safetensors",
+ "model.layers.58.mlp.down_proj.weight_scale": "model-00119-of-00189.safetensors",
+ "model.layers.58.mlp.up_proj.weight": "model-00118-of-00189.safetensors",
+ "model.layers.58.mlp.up_proj.weight_scale": "model-00118-of-00189.safetensors",
+ "model.layers.58.post_attention_layernorm.bias": "model-00119-of-00189.safetensors",
+ "model.layers.58.post_attention_layernorm.weight": "model-00119-of-00189.safetensors",
+ "model.layers.58.self_attn.k_proj.weight": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.k_proj.weight_scale": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.o_proj.weight": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.o_proj.weight_scale": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.q_proj.weight": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.q_proj.weight_scale": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.v_proj.weight": "model-00117-of-00189.safetensors",
+ "model.layers.58.self_attn.v_proj.weight_scale": "model-00117-of-00189.safetensors",
+ "model.layers.59.input_layernorm.bias": "model-00121-of-00189.safetensors",
+ "model.layers.59.input_layernorm.weight": "model-00121-of-00189.safetensors",
+ "model.layers.59.mlp.down_proj.weight": "model-00121-of-00189.safetensors",
+ "model.layers.59.mlp.down_proj.weight_scale": "model-00121-of-00189.safetensors",
+ "model.layers.59.mlp.up_proj.weight": "model-00120-of-00189.safetensors",
+ "model.layers.59.mlp.up_proj.weight_scale": "model-00120-of-00189.safetensors",
+ "model.layers.59.post_attention_layernorm.bias": "model-00121-of-00189.safetensors",
+ "model.layers.59.post_attention_layernorm.weight": "model-00121-of-00189.safetensors",
+ "model.layers.59.self_attn.k_proj.weight": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.k_proj.weight_scale": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.o_proj.weight": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.o_proj.weight_scale": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.q_proj.weight": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.q_proj.weight_scale": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.v_proj.weight": "model-00119-of-00189.safetensors",
+ "model.layers.59.self_attn.v_proj.weight_scale": "model-00119-of-00189.safetensors",
+ "model.layers.6.input_layernorm.bias": "model-00015-of-00189.safetensors",
+ "model.layers.6.input_layernorm.weight": "model-00015-of-00189.safetensors",
+ "model.layers.6.mlp.down_proj.weight": "model-00015-of-00189.safetensors",
+ "model.layers.6.mlp.down_proj.weight_scale": "model-00015-of-00189.safetensors",
+ "model.layers.6.mlp.up_proj.weight": "model-00014-of-00189.safetensors",
+ "model.layers.6.mlp.up_proj.weight_scale": "model-00014-of-00189.safetensors",
+ "model.layers.6.post_attention_layernorm.bias": "model-00015-of-00189.safetensors",
+ "model.layers.6.post_attention_layernorm.weight": "model-00015-of-00189.safetensors",
+ "model.layers.6.self_attn.k_proj.weight": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.k_proj.weight_scale": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.o_proj.weight": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.o_proj.weight_scale": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.q_proj.weight": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.q_proj.weight_scale": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.v_proj.weight": "model-00013-of-00189.safetensors",
+ "model.layers.6.self_attn.v_proj.weight_scale": "model-00013-of-00189.safetensors",
+ "model.layers.60.input_layernorm.bias": "model-00123-of-00189.safetensors",
+ "model.layers.60.input_layernorm.weight": "model-00123-of-00189.safetensors",
+ "model.layers.60.mlp.down_proj.weight": "model-00123-of-00189.safetensors",
+ "model.layers.60.mlp.down_proj.weight_scale": "model-00123-of-00189.safetensors",
+ "model.layers.60.mlp.up_proj.weight": "model-00122-of-00189.safetensors",
+ "model.layers.60.mlp.up_proj.weight_scale": "model-00122-of-00189.safetensors",
+ "model.layers.60.post_attention_layernorm.bias": "model-00123-of-00189.safetensors",
+ "model.layers.60.post_attention_layernorm.weight": "model-00123-of-00189.safetensors",
+ "model.layers.60.self_attn.k_proj.weight": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.k_proj.weight_scale": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.o_proj.weight": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.o_proj.weight_scale": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.q_proj.weight": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.q_proj.weight_scale": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.v_proj.weight": "model-00121-of-00189.safetensors",
+ "model.layers.60.self_attn.v_proj.weight_scale": "model-00121-of-00189.safetensors",
+ "model.layers.61.input_layernorm.bias": "model-00125-of-00189.safetensors",
+ "model.layers.61.input_layernorm.weight": "model-00125-of-00189.safetensors",
+ "model.layers.61.mlp.down_proj.weight": "model-00125-of-00189.safetensors",
+ "model.layers.61.mlp.down_proj.weight_scale": "model-00125-of-00189.safetensors",
+ "model.layers.61.mlp.up_proj.weight": "model-00124-of-00189.safetensors",
+ "model.layers.61.mlp.up_proj.weight_scale": "model-00124-of-00189.safetensors",
+ "model.layers.61.post_attention_layernorm.bias": "model-00125-of-00189.safetensors",
+ "model.layers.61.post_attention_layernorm.weight": "model-00125-of-00189.safetensors",
+ "model.layers.61.self_attn.k_proj.weight": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.k_proj.weight_scale": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.o_proj.weight": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.o_proj.weight_scale": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.q_proj.weight": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.q_proj.weight_scale": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.v_proj.weight": "model-00123-of-00189.safetensors",
+ "model.layers.61.self_attn.v_proj.weight_scale": "model-00123-of-00189.safetensors",
+ "model.layers.62.input_layernorm.bias": "model-00127-of-00189.safetensors",
+ "model.layers.62.input_layernorm.weight": "model-00127-of-00189.safetensors",
+ "model.layers.62.mlp.down_proj.weight": "model-00127-of-00189.safetensors",
+ "model.layers.62.mlp.down_proj.weight_scale": "model-00127-of-00189.safetensors",
+ "model.layers.62.mlp.up_proj.weight": "model-00126-of-00189.safetensors",
+ "model.layers.62.mlp.up_proj.weight_scale": "model-00126-of-00189.safetensors",
+ "model.layers.62.post_attention_layernorm.bias": "model-00127-of-00189.safetensors",
+ "model.layers.62.post_attention_layernorm.weight": "model-00127-of-00189.safetensors",
+ "model.layers.62.self_attn.k_proj.weight": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.k_proj.weight_scale": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.o_proj.weight": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.o_proj.weight_scale": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.q_proj.weight": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.q_proj.weight_scale": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.v_proj.weight": "model-00125-of-00189.safetensors",
+ "model.layers.62.self_attn.v_proj.weight_scale": "model-00125-of-00189.safetensors",
+ "model.layers.63.input_layernorm.bias": "model-00129-of-00189.safetensors",
+ "model.layers.63.input_layernorm.weight": "model-00129-of-00189.safetensors",
+ "model.layers.63.mlp.down_proj.weight": "model-00129-of-00189.safetensors",
+ "model.layers.63.mlp.down_proj.weight_scale": "model-00129-of-00189.safetensors",
+ "model.layers.63.mlp.up_proj.weight": "model-00128-of-00189.safetensors",
+ "model.layers.63.mlp.up_proj.weight_scale": "model-00128-of-00189.safetensors",
+ "model.layers.63.post_attention_layernorm.bias": "model-00129-of-00189.safetensors",
+ "model.layers.63.post_attention_layernorm.weight": "model-00129-of-00189.safetensors",
+ "model.layers.63.self_attn.k_proj.weight": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.k_proj.weight_scale": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.o_proj.weight": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.o_proj.weight_scale": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.q_proj.weight": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.q_proj.weight_scale": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.v_proj.weight": "model-00127-of-00189.safetensors",
+ "model.layers.63.self_attn.v_proj.weight_scale": "model-00127-of-00189.safetensors",
+ "model.layers.64.input_layernorm.bias": "model-00131-of-00189.safetensors",
+ "model.layers.64.input_layernorm.weight": "model-00131-of-00189.safetensors",
+ "model.layers.64.mlp.down_proj.weight": "model-00131-of-00189.safetensors",
+ "model.layers.64.mlp.down_proj.weight_scale": "model-00131-of-00189.safetensors",
+ "model.layers.64.mlp.up_proj.weight": "model-00130-of-00189.safetensors",
+ "model.layers.64.mlp.up_proj.weight_scale": "model-00130-of-00189.safetensors",
+ "model.layers.64.post_attention_layernorm.bias": "model-00131-of-00189.safetensors",
+ "model.layers.64.post_attention_layernorm.weight": "model-00131-of-00189.safetensors",
+ "model.layers.64.self_attn.k_proj.weight": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.k_proj.weight_scale": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.o_proj.weight": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.o_proj.weight_scale": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.q_proj.weight": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.q_proj.weight_scale": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.v_proj.weight": "model-00129-of-00189.safetensors",
+ "model.layers.64.self_attn.v_proj.weight_scale": "model-00129-of-00189.safetensors",
+ "model.layers.65.input_layernorm.bias": "model-00133-of-00189.safetensors",
+ "model.layers.65.input_layernorm.weight": "model-00133-of-00189.safetensors",
+ "model.layers.65.mlp.down_proj.weight": "model-00133-of-00189.safetensors",
+ "model.layers.65.mlp.down_proj.weight_scale": "model-00133-of-00189.safetensors",
+ "model.layers.65.mlp.up_proj.weight": "model-00132-of-00189.safetensors",
+ "model.layers.65.mlp.up_proj.weight_scale": "model-00132-of-00189.safetensors",
+ "model.layers.65.post_attention_layernorm.bias": "model-00133-of-00189.safetensors",
+ "model.layers.65.post_attention_layernorm.weight": "model-00133-of-00189.safetensors",
+ "model.layers.65.self_attn.k_proj.weight": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.k_proj.weight_scale": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.o_proj.weight": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.o_proj.weight_scale": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.q_proj.weight": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.q_proj.weight_scale": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.v_proj.weight": "model-00131-of-00189.safetensors",
+ "model.layers.65.self_attn.v_proj.weight_scale": "model-00131-of-00189.safetensors",
+ "model.layers.66.input_layernorm.bias": "model-00135-of-00189.safetensors",
+ "model.layers.66.input_layernorm.weight": "model-00135-of-00189.safetensors",
+ "model.layers.66.mlp.down_proj.weight": "model-00135-of-00189.safetensors",
+ "model.layers.66.mlp.down_proj.weight_scale": "model-00135-of-00189.safetensors",
+ "model.layers.66.mlp.up_proj.weight": "model-00134-of-00189.safetensors",
+ "model.layers.66.mlp.up_proj.weight_scale": "model-00134-of-00189.safetensors",
+ "model.layers.66.post_attention_layernorm.bias": "model-00135-of-00189.safetensors",
+ "model.layers.66.post_attention_layernorm.weight": "model-00135-of-00189.safetensors",
+ "model.layers.66.self_attn.k_proj.weight": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.k_proj.weight_scale": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.o_proj.weight": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.o_proj.weight_scale": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.q_proj.weight": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.q_proj.weight_scale": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.v_proj.weight": "model-00133-of-00189.safetensors",
+ "model.layers.66.self_attn.v_proj.weight_scale": "model-00133-of-00189.safetensors",
+ "model.layers.67.input_layernorm.bias": "model-00137-of-00189.safetensors",
+ "model.layers.67.input_layernorm.weight": "model-00137-of-00189.safetensors",
+ "model.layers.67.mlp.down_proj.weight": "model-00137-of-00189.safetensors",
+ "model.layers.67.mlp.down_proj.weight_scale": "model-00137-of-00189.safetensors",
+ "model.layers.67.mlp.up_proj.weight": "model-00136-of-00189.safetensors",
+ "model.layers.67.mlp.up_proj.weight_scale": "model-00136-of-00189.safetensors",
+ "model.layers.67.post_attention_layernorm.bias": "model-00137-of-00189.safetensors",
+ "model.layers.67.post_attention_layernorm.weight": "model-00137-of-00189.safetensors",
+ "model.layers.67.self_attn.k_proj.weight": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.k_proj.weight_scale": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.o_proj.weight": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.o_proj.weight_scale": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.q_proj.weight": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.q_proj.weight_scale": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.v_proj.weight": "model-00135-of-00189.safetensors",
+ "model.layers.67.self_attn.v_proj.weight_scale": "model-00135-of-00189.safetensors",
+ "model.layers.68.input_layernorm.bias": "model-00139-of-00189.safetensors",
+ "model.layers.68.input_layernorm.weight": "model-00139-of-00189.safetensors",
+ "model.layers.68.mlp.down_proj.weight": "model-00139-of-00189.safetensors",
+ "model.layers.68.mlp.down_proj.weight_scale": "model-00139-of-00189.safetensors",
+ "model.layers.68.mlp.up_proj.weight": "model-00138-of-00189.safetensors",
+ "model.layers.68.mlp.up_proj.weight_scale": "model-00138-of-00189.safetensors",
+ "model.layers.68.post_attention_layernorm.bias": "model-00139-of-00189.safetensors",
+ "model.layers.68.post_attention_layernorm.weight": "model-00139-of-00189.safetensors",
+ "model.layers.68.self_attn.k_proj.weight": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.k_proj.weight_scale": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.o_proj.weight": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.o_proj.weight_scale": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.q_proj.weight": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.q_proj.weight_scale": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.v_proj.weight": "model-00137-of-00189.safetensors",
+ "model.layers.68.self_attn.v_proj.weight_scale": "model-00137-of-00189.safetensors",
+ "model.layers.69.input_layernorm.bias": "model-00141-of-00189.safetensors",
+ "model.layers.69.input_layernorm.weight": "model-00141-of-00189.safetensors",
+ "model.layers.69.mlp.down_proj.weight": "model-00141-of-00189.safetensors",
+ "model.layers.69.mlp.down_proj.weight_scale": "model-00141-of-00189.safetensors",
+ "model.layers.69.mlp.up_proj.weight": "model-00140-of-00189.safetensors",
+ "model.layers.69.mlp.up_proj.weight_scale": "model-00140-of-00189.safetensors",
+ "model.layers.69.post_attention_layernorm.bias": "model-00141-of-00189.safetensors",
+ "model.layers.69.post_attention_layernorm.weight": "model-00141-of-00189.safetensors",
+ "model.layers.69.self_attn.k_proj.weight": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.k_proj.weight_scale": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.o_proj.weight": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.o_proj.weight_scale": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.q_proj.weight": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.q_proj.weight_scale": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.v_proj.weight": "model-00139-of-00189.safetensors",
+ "model.layers.69.self_attn.v_proj.weight_scale": "model-00139-of-00189.safetensors",
+ "model.layers.7.input_layernorm.bias": "model-00017-of-00189.safetensors",
+ "model.layers.7.input_layernorm.weight": "model-00017-of-00189.safetensors",
+ "model.layers.7.mlp.down_proj.weight": "model-00017-of-00189.safetensors",
+ "model.layers.7.mlp.down_proj.weight_scale": "model-00017-of-00189.safetensors",
+ "model.layers.7.mlp.up_proj.weight": "model-00016-of-00189.safetensors",
+ "model.layers.7.mlp.up_proj.weight_scale": "model-00016-of-00189.safetensors",
+ "model.layers.7.post_attention_layernorm.bias": "model-00017-of-00189.safetensors",
+ "model.layers.7.post_attention_layernorm.weight": "model-00017-of-00189.safetensors",
+ "model.layers.7.self_attn.k_proj.weight": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.k_proj.weight_scale": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.o_proj.weight": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.o_proj.weight_scale": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.q_proj.weight": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.q_proj.weight_scale": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.v_proj.weight": "model-00015-of-00189.safetensors",
+ "model.layers.7.self_attn.v_proj.weight_scale": "model-00015-of-00189.safetensors",
+ "model.layers.70.input_layernorm.bias": "model-00143-of-00189.safetensors",
+ "model.layers.70.input_layernorm.weight": "model-00143-of-00189.safetensors",
+ "model.layers.70.mlp.down_proj.weight": "model-00143-of-00189.safetensors",
+ "model.layers.70.mlp.down_proj.weight_scale": "model-00143-of-00189.safetensors",
+ "model.layers.70.mlp.up_proj.weight": "model-00142-of-00189.safetensors",
+ "model.layers.70.mlp.up_proj.weight_scale": "model-00142-of-00189.safetensors",
+ "model.layers.70.post_attention_layernorm.bias": "model-00143-of-00189.safetensors",
+ "model.layers.70.post_attention_layernorm.weight": "model-00143-of-00189.safetensors",
+ "model.layers.70.self_attn.k_proj.weight": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.k_proj.weight_scale": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.o_proj.weight": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.o_proj.weight_scale": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.q_proj.weight": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.q_proj.weight_scale": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.v_proj.weight": "model-00141-of-00189.safetensors",
+ "model.layers.70.self_attn.v_proj.weight_scale": "model-00141-of-00189.safetensors",
+ "model.layers.71.input_layernorm.bias": "model-00145-of-00189.safetensors",
+ "model.layers.71.input_layernorm.weight": "model-00145-of-00189.safetensors",
+ "model.layers.71.mlp.down_proj.weight": "model-00145-of-00189.safetensors",
+ "model.layers.71.mlp.down_proj.weight_scale": "model-00145-of-00189.safetensors",
+ "model.layers.71.mlp.up_proj.weight": "model-00144-of-00189.safetensors",
+ "model.layers.71.mlp.up_proj.weight_scale": "model-00144-of-00189.safetensors",
+ "model.layers.71.post_attention_layernorm.bias": "model-00145-of-00189.safetensors",
+ "model.layers.71.post_attention_layernorm.weight": "model-00145-of-00189.safetensors",
+ "model.layers.71.self_attn.k_proj.weight": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.k_proj.weight_scale": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.o_proj.weight": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.o_proj.weight_scale": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.q_proj.weight": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.q_proj.weight_scale": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.v_proj.weight": "model-00143-of-00189.safetensors",
+ "model.layers.71.self_attn.v_proj.weight_scale": "model-00143-of-00189.safetensors",
+ "model.layers.72.input_layernorm.bias": "model-00147-of-00189.safetensors",
+ "model.layers.72.input_layernorm.weight": "model-00147-of-00189.safetensors",
+ "model.layers.72.mlp.down_proj.weight": "model-00147-of-00189.safetensors",
+ "model.layers.72.mlp.down_proj.weight_scale": "model-00147-of-00189.safetensors",
+ "model.layers.72.mlp.up_proj.weight": "model-00146-of-00189.safetensors",
+ "model.layers.72.mlp.up_proj.weight_scale": "model-00146-of-00189.safetensors",
+ "model.layers.72.post_attention_layernorm.bias": "model-00147-of-00189.safetensors",
+ "model.layers.72.post_attention_layernorm.weight": "model-00147-of-00189.safetensors",
+ "model.layers.72.self_attn.k_proj.weight": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.k_proj.weight_scale": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.o_proj.weight": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.o_proj.weight_scale": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.q_proj.weight": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.q_proj.weight_scale": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.v_proj.weight": "model-00145-of-00189.safetensors",
+ "model.layers.72.self_attn.v_proj.weight_scale": "model-00145-of-00189.safetensors",
+ "model.layers.73.input_layernorm.bias": "model-00149-of-00189.safetensors",
+ "model.layers.73.input_layernorm.weight": "model-00149-of-00189.safetensors",
+ "model.layers.73.mlp.down_proj.weight": "model-00149-of-00189.safetensors",
+ "model.layers.73.mlp.down_proj.weight_scale": "model-00149-of-00189.safetensors",
+ "model.layers.73.mlp.up_proj.weight": "model-00148-of-00189.safetensors",
+ "model.layers.73.mlp.up_proj.weight_scale": "model-00148-of-00189.safetensors",
+ "model.layers.73.post_attention_layernorm.bias": "model-00149-of-00189.safetensors",
+ "model.layers.73.post_attention_layernorm.weight": "model-00149-of-00189.safetensors",
+ "model.layers.73.self_attn.k_proj.weight": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.k_proj.weight_scale": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.o_proj.weight": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.o_proj.weight_scale": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.q_proj.weight": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.q_proj.weight_scale": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.v_proj.weight": "model-00147-of-00189.safetensors",
+ "model.layers.73.self_attn.v_proj.weight_scale": "model-00147-of-00189.safetensors",
+ "model.layers.74.input_layernorm.bias": "model-00151-of-00189.safetensors",
+ "model.layers.74.input_layernorm.weight": "model-00151-of-00189.safetensors",
+ "model.layers.74.mlp.down_proj.weight": "model-00151-of-00189.safetensors",
+ "model.layers.74.mlp.down_proj.weight_scale": "model-00151-of-00189.safetensors",
+ "model.layers.74.mlp.up_proj.weight": "model-00150-of-00189.safetensors",
+ "model.layers.74.mlp.up_proj.weight_scale": "model-00150-of-00189.safetensors",
+ "model.layers.74.post_attention_layernorm.bias": "model-00151-of-00189.safetensors",
+ "model.layers.74.post_attention_layernorm.weight": "model-00151-of-00189.safetensors",
+ "model.layers.74.self_attn.k_proj.weight": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.k_proj.weight_scale": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.o_proj.weight": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.o_proj.weight_scale": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.q_proj.weight": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.q_proj.weight_scale": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.v_proj.weight": "model-00149-of-00189.safetensors",
+ "model.layers.74.self_attn.v_proj.weight_scale": "model-00149-of-00189.safetensors",
+ "model.layers.75.input_layernorm.bias": "model-00153-of-00189.safetensors",
+ "model.layers.75.input_layernorm.weight": "model-00153-of-00189.safetensors",
+ "model.layers.75.mlp.down_proj.weight": "model-00153-of-00189.safetensors",
+ "model.layers.75.mlp.down_proj.weight_scale": "model-00153-of-00189.safetensors",
+ "model.layers.75.mlp.up_proj.weight": "model-00152-of-00189.safetensors",
+ "model.layers.75.mlp.up_proj.weight_scale": "model-00152-of-00189.safetensors",
+ "model.layers.75.post_attention_layernorm.bias": "model-00153-of-00189.safetensors",
+ "model.layers.75.post_attention_layernorm.weight": "model-00153-of-00189.safetensors",
+ "model.layers.75.self_attn.k_proj.weight": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.k_proj.weight_scale": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.o_proj.weight": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.o_proj.weight_scale": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.q_proj.weight": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.q_proj.weight_scale": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.v_proj.weight": "model-00151-of-00189.safetensors",
+ "model.layers.75.self_attn.v_proj.weight_scale": "model-00151-of-00189.safetensors",
+ "model.layers.76.input_layernorm.bias": "model-00155-of-00189.safetensors",
+ "model.layers.76.input_layernorm.weight": "model-00155-of-00189.safetensors",
+ "model.layers.76.mlp.down_proj.weight": "model-00155-of-00189.safetensors",
+ "model.layers.76.mlp.down_proj.weight_scale": "model-00155-of-00189.safetensors",
+ "model.layers.76.mlp.up_proj.weight": "model-00154-of-00189.safetensors",
+ "model.layers.76.mlp.up_proj.weight_scale": "model-00154-of-00189.safetensors",
+ "model.layers.76.post_attention_layernorm.bias": "model-00155-of-00189.safetensors",
+ "model.layers.76.post_attention_layernorm.weight": "model-00155-of-00189.safetensors",
+ "model.layers.76.self_attn.k_proj.weight": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.k_proj.weight_scale": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.o_proj.weight": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.o_proj.weight_scale": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.q_proj.weight": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.q_proj.weight_scale": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.v_proj.weight": "model-00153-of-00189.safetensors",
+ "model.layers.76.self_attn.v_proj.weight_scale": "model-00153-of-00189.safetensors",
+ "model.layers.77.input_layernorm.bias": "model-00157-of-00189.safetensors",
+ "model.layers.77.input_layernorm.weight": "model-00157-of-00189.safetensors",
+ "model.layers.77.mlp.down_proj.weight": "model-00157-of-00189.safetensors",
+ "model.layers.77.mlp.down_proj.weight_scale": "model-00157-of-00189.safetensors",
+ "model.layers.77.mlp.up_proj.weight": "model-00156-of-00189.safetensors",
+ "model.layers.77.mlp.up_proj.weight_scale": "model-00156-of-00189.safetensors",
+ "model.layers.77.post_attention_layernorm.bias": "model-00157-of-00189.safetensors",
+ "model.layers.77.post_attention_layernorm.weight": "model-00157-of-00189.safetensors",
+ "model.layers.77.self_attn.k_proj.weight": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.k_proj.weight_scale": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.o_proj.weight": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.o_proj.weight_scale": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.q_proj.weight": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.q_proj.weight_scale": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.v_proj.weight": "model-00155-of-00189.safetensors",
+ "model.layers.77.self_attn.v_proj.weight_scale": "model-00155-of-00189.safetensors",
+ "model.layers.78.input_layernorm.bias": "model-00159-of-00189.safetensors",
+ "model.layers.78.input_layernorm.weight": "model-00159-of-00189.safetensors",
+ "model.layers.78.mlp.down_proj.weight": "model-00159-of-00189.safetensors",
+ "model.layers.78.mlp.down_proj.weight_scale": "model-00159-of-00189.safetensors",
+ "model.layers.78.mlp.up_proj.weight": "model-00158-of-00189.safetensors",
+ "model.layers.78.mlp.up_proj.weight_scale": "model-00158-of-00189.safetensors",
+ "model.layers.78.post_attention_layernorm.bias": "model-00159-of-00189.safetensors",
+ "model.layers.78.post_attention_layernorm.weight": "model-00159-of-00189.safetensors",
+ "model.layers.78.self_attn.k_proj.weight": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.k_proj.weight_scale": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.o_proj.weight": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.o_proj.weight_scale": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.q_proj.weight": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.q_proj.weight_scale": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.v_proj.weight": "model-00157-of-00189.safetensors",
+ "model.layers.78.self_attn.v_proj.weight_scale": "model-00157-of-00189.safetensors",
+ "model.layers.79.input_layernorm.bias": "model-00161-of-00189.safetensors",
+ "model.layers.79.input_layernorm.weight": "model-00161-of-00189.safetensors",
+ "model.layers.79.mlp.down_proj.weight": "model-00161-of-00189.safetensors",
+ "model.layers.79.mlp.down_proj.weight_scale": "model-00161-of-00189.safetensors",
+ "model.layers.79.mlp.up_proj.weight": "model-00160-of-00189.safetensors",
+ "model.layers.79.mlp.up_proj.weight_scale": "model-00160-of-00189.safetensors",
+ "model.layers.79.post_attention_layernorm.bias": "model-00161-of-00189.safetensors",
+ "model.layers.79.post_attention_layernorm.weight": "model-00161-of-00189.safetensors",
+ "model.layers.79.self_attn.k_proj.weight": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.k_proj.weight_scale": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.o_proj.weight": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.o_proj.weight_scale": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.q_proj.weight": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.q_proj.weight_scale": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.v_proj.weight": "model-00159-of-00189.safetensors",
+ "model.layers.79.self_attn.v_proj.weight_scale": "model-00159-of-00189.safetensors",
+ "model.layers.8.input_layernorm.bias": "model-00019-of-00189.safetensors",
+ "model.layers.8.input_layernorm.weight": "model-00019-of-00189.safetensors",
+ "model.layers.8.mlp.down_proj.weight": "model-00019-of-00189.safetensors",
+ "model.layers.8.mlp.down_proj.weight_scale": "model-00019-of-00189.safetensors",
+ "model.layers.8.mlp.up_proj.weight": "model-00018-of-00189.safetensors",
+ "model.layers.8.mlp.up_proj.weight_scale": "model-00018-of-00189.safetensors",
+ "model.layers.8.post_attention_layernorm.bias": "model-00019-of-00189.safetensors",
+ "model.layers.8.post_attention_layernorm.weight": "model-00019-of-00189.safetensors",
+ "model.layers.8.self_attn.k_proj.weight": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.k_proj.weight_scale": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.o_proj.weight": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.o_proj.weight_scale": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.q_proj.weight": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.q_proj.weight_scale": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.v_proj.weight": "model-00017-of-00189.safetensors",
+ "model.layers.8.self_attn.v_proj.weight_scale": "model-00017-of-00189.safetensors",
+ "model.layers.80.input_layernorm.bias": "model-00163-of-00189.safetensors",
+ "model.layers.80.input_layernorm.weight": "model-00163-of-00189.safetensors",
+ "model.layers.80.mlp.down_proj.weight": "model-00163-of-00189.safetensors",
+ "model.layers.80.mlp.down_proj.weight_scale": "model-00163-of-00189.safetensors",
+ "model.layers.80.mlp.up_proj.weight": "model-00162-of-00189.safetensors",
+ "model.layers.80.mlp.up_proj.weight_scale": "model-00162-of-00189.safetensors",
+ "model.layers.80.post_attention_layernorm.bias": "model-00163-of-00189.safetensors",
+ "model.layers.80.post_attention_layernorm.weight": "model-00163-of-00189.safetensors",
+ "model.layers.80.self_attn.k_proj.weight": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.k_proj.weight_scale": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.o_proj.weight": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.o_proj.weight_scale": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.q_proj.weight": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.q_proj.weight_scale": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.v_proj.weight": "model-00161-of-00189.safetensors",
+ "model.layers.80.self_attn.v_proj.weight_scale": "model-00161-of-00189.safetensors",
+ "model.layers.81.input_layernorm.bias": "model-00165-of-00189.safetensors",
+ "model.layers.81.input_layernorm.weight": "model-00165-of-00189.safetensors",
+ "model.layers.81.mlp.down_proj.weight": "model-00165-of-00189.safetensors",
+ "model.layers.81.mlp.down_proj.weight_scale": "model-00165-of-00189.safetensors",
+ "model.layers.81.mlp.up_proj.weight": "model-00164-of-00189.safetensors",
+ "model.layers.81.mlp.up_proj.weight_scale": "model-00164-of-00189.safetensors",
+ "model.layers.81.post_attention_layernorm.bias": "model-00165-of-00189.safetensors",
+ "model.layers.81.post_attention_layernorm.weight": "model-00165-of-00189.safetensors",
+ "model.layers.81.self_attn.k_proj.weight": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.k_proj.weight_scale": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.o_proj.weight": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.o_proj.weight_scale": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.q_proj.weight": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.q_proj.weight_scale": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.v_proj.weight": "model-00163-of-00189.safetensors",
+ "model.layers.81.self_attn.v_proj.weight_scale": "model-00163-of-00189.safetensors",
+ "model.layers.82.input_layernorm.bias": "model-00167-of-00189.safetensors",
+ "model.layers.82.input_layernorm.weight": "model-00167-of-00189.safetensors",
+ "model.layers.82.mlp.down_proj.weight": "model-00167-of-00189.safetensors",
+ "model.layers.82.mlp.down_proj.weight_scale": "model-00167-of-00189.safetensors",
+ "model.layers.82.mlp.up_proj.weight": "model-00166-of-00189.safetensors",
+ "model.layers.82.mlp.up_proj.weight_scale": "model-00166-of-00189.safetensors",
+ "model.layers.82.post_attention_layernorm.bias": "model-00167-of-00189.safetensors",
+ "model.layers.82.post_attention_layernorm.weight": "model-00167-of-00189.safetensors",
+ "model.layers.82.self_attn.k_proj.weight": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.k_proj.weight_scale": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.o_proj.weight": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.o_proj.weight_scale": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.q_proj.weight": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.q_proj.weight_scale": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.v_proj.weight": "model-00165-of-00189.safetensors",
+ "model.layers.82.self_attn.v_proj.weight_scale": "model-00165-of-00189.safetensors",
+ "model.layers.83.input_layernorm.bias": "model-00169-of-00189.safetensors",
+ "model.layers.83.input_layernorm.weight": "model-00169-of-00189.safetensors",
+ "model.layers.83.mlp.down_proj.weight": "model-00169-of-00189.safetensors",
+ "model.layers.83.mlp.down_proj.weight_scale": "model-00169-of-00189.safetensors",
+ "model.layers.83.mlp.up_proj.weight": "model-00168-of-00189.safetensors",
+ "model.layers.83.mlp.up_proj.weight_scale": "model-00168-of-00189.safetensors",
+ "model.layers.83.post_attention_layernorm.bias": "model-00169-of-00189.safetensors",
+ "model.layers.83.post_attention_layernorm.weight": "model-00169-of-00189.safetensors",
+ "model.layers.83.self_attn.k_proj.weight": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.k_proj.weight_scale": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.o_proj.weight": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.o_proj.weight_scale": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.q_proj.weight": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.q_proj.weight_scale": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.v_proj.weight": "model-00167-of-00189.safetensors",
+ "model.layers.83.self_attn.v_proj.weight_scale": "model-00167-of-00189.safetensors",
+ "model.layers.84.input_layernorm.bias": "model-00171-of-00189.safetensors",
+ "model.layers.84.input_layernorm.weight": "model-00171-of-00189.safetensors",
+ "model.layers.84.mlp.down_proj.weight": "model-00171-of-00189.safetensors",
+ "model.layers.84.mlp.down_proj.weight_scale": "model-00171-of-00189.safetensors",
+ "model.layers.84.mlp.up_proj.weight": "model-00170-of-00189.safetensors",
+ "model.layers.84.mlp.up_proj.weight_scale": "model-00170-of-00189.safetensors",
+ "model.layers.84.post_attention_layernorm.bias": "model-00171-of-00189.safetensors",
+ "model.layers.84.post_attention_layernorm.weight": "model-00171-of-00189.safetensors",
+ "model.layers.84.self_attn.k_proj.weight": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.k_proj.weight_scale": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.o_proj.weight": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.o_proj.weight_scale": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.q_proj.weight": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.q_proj.weight_scale": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.v_proj.weight": "model-00169-of-00189.safetensors",
+ "model.layers.84.self_attn.v_proj.weight_scale": "model-00169-of-00189.safetensors",
+ "model.layers.85.input_layernorm.bias": "model-00173-of-00189.safetensors",
+ "model.layers.85.input_layernorm.weight": "model-00173-of-00189.safetensors",
+ "model.layers.85.mlp.down_proj.weight": "model-00173-of-00189.safetensors",
+ "model.layers.85.mlp.down_proj.weight_scale": "model-00173-of-00189.safetensors",
+ "model.layers.85.mlp.up_proj.weight": "model-00172-of-00189.safetensors",
+ "model.layers.85.mlp.up_proj.weight_scale": "model-00172-of-00189.safetensors",
+ "model.layers.85.post_attention_layernorm.bias": "model-00173-of-00189.safetensors",
+ "model.layers.85.post_attention_layernorm.weight": "model-00173-of-00189.safetensors",
+ "model.layers.85.self_attn.k_proj.weight": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.k_proj.weight_scale": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.o_proj.weight": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.o_proj.weight_scale": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.q_proj.weight": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.q_proj.weight_scale": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.v_proj.weight": "model-00171-of-00189.safetensors",
+ "model.layers.85.self_attn.v_proj.weight_scale": "model-00171-of-00189.safetensors",
+ "model.layers.86.input_layernorm.bias": "model-00175-of-00189.safetensors",
+ "model.layers.86.input_layernorm.weight": "model-00175-of-00189.safetensors",
+ "model.layers.86.mlp.down_proj.weight": "model-00175-of-00189.safetensors",
+ "model.layers.86.mlp.down_proj.weight_scale": "model-00175-of-00189.safetensors",
+ "model.layers.86.mlp.up_proj.weight": "model-00174-of-00189.safetensors",
+ "model.layers.86.mlp.up_proj.weight_scale": "model-00174-of-00189.safetensors",
+ "model.layers.86.post_attention_layernorm.bias": "model-00175-of-00189.safetensors",
+ "model.layers.86.post_attention_layernorm.weight": "model-00175-of-00189.safetensors",
+ "model.layers.86.self_attn.k_proj.weight": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.k_proj.weight_scale": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.o_proj.weight": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.o_proj.weight_scale": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.q_proj.weight": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.q_proj.weight_scale": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.v_proj.weight": "model-00173-of-00189.safetensors",
+ "model.layers.86.self_attn.v_proj.weight_scale": "model-00173-of-00189.safetensors",
+ "model.layers.87.input_layernorm.bias": "model-00177-of-00189.safetensors",
+ "model.layers.87.input_layernorm.weight": "model-00177-of-00189.safetensors",
+ "model.layers.87.mlp.down_proj.weight": "model-00177-of-00189.safetensors",
+ "model.layers.87.mlp.down_proj.weight_scale": "model-00177-of-00189.safetensors",
+ "model.layers.87.mlp.up_proj.weight": "model-00176-of-00189.safetensors",
+ "model.layers.87.mlp.up_proj.weight_scale": "model-00176-of-00189.safetensors",
+ "model.layers.87.post_attention_layernorm.bias": "model-00177-of-00189.safetensors",
+ "model.layers.87.post_attention_layernorm.weight": "model-00177-of-00189.safetensors",
+ "model.layers.87.self_attn.k_proj.weight": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.k_proj.weight_scale": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.o_proj.weight": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.o_proj.weight_scale": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.q_proj.weight": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.q_proj.weight_scale": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.v_proj.weight": "model-00175-of-00189.safetensors",
+ "model.layers.87.self_attn.v_proj.weight_scale": "model-00175-of-00189.safetensors",
+ "model.layers.88.input_layernorm.bias": "model-00179-of-00189.safetensors",
+ "model.layers.88.input_layernorm.weight": "model-00179-of-00189.safetensors",
+ "model.layers.88.mlp.down_proj.weight": "model-00179-of-00189.safetensors",
+ "model.layers.88.mlp.down_proj.weight_scale": "model-00179-of-00189.safetensors",
+ "model.layers.88.mlp.up_proj.weight": "model-00178-of-00189.safetensors",
+ "model.layers.88.mlp.up_proj.weight_scale": "model-00178-of-00189.safetensors",
+ "model.layers.88.post_attention_layernorm.bias": "model-00179-of-00189.safetensors",
+ "model.layers.88.post_attention_layernorm.weight": "model-00179-of-00189.safetensors",
+ "model.layers.88.self_attn.k_proj.weight": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.k_proj.weight_scale": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.o_proj.weight": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.o_proj.weight_scale": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.q_proj.weight": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.q_proj.weight_scale": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.v_proj.weight": "model-00177-of-00189.safetensors",
+ "model.layers.88.self_attn.v_proj.weight_scale": "model-00177-of-00189.safetensors",
+ "model.layers.89.input_layernorm.bias": "model-00181-of-00189.safetensors",
+ "model.layers.89.input_layernorm.weight": "model-00181-of-00189.safetensors",
+ "model.layers.89.mlp.down_proj.weight": "model-00181-of-00189.safetensors",
+ "model.layers.89.mlp.down_proj.weight_scale": "model-00181-of-00189.safetensors",
+ "model.layers.89.mlp.up_proj.weight": "model-00180-of-00189.safetensors",
+ "model.layers.89.mlp.up_proj.weight_scale": "model-00180-of-00189.safetensors",
+ "model.layers.89.post_attention_layernorm.bias": "model-00181-of-00189.safetensors",
+ "model.layers.89.post_attention_layernorm.weight": "model-00181-of-00189.safetensors",
+ "model.layers.89.self_attn.k_proj.weight": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.k_proj.weight_scale": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.o_proj.weight": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.o_proj.weight_scale": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.q_proj.weight": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.q_proj.weight_scale": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.v_proj.weight": "model-00179-of-00189.safetensors",
+ "model.layers.89.self_attn.v_proj.weight_scale": "model-00179-of-00189.safetensors",
+ "model.layers.9.input_layernorm.bias": "model-00021-of-00189.safetensors",
+ "model.layers.9.input_layernorm.weight": "model-00021-of-00189.safetensors",
+ "model.layers.9.mlp.down_proj.weight": "model-00021-of-00189.safetensors",
+ "model.layers.9.mlp.down_proj.weight_scale": "model-00021-of-00189.safetensors",
+ "model.layers.9.mlp.up_proj.weight": "model-00020-of-00189.safetensors",
+ "model.layers.9.mlp.up_proj.weight_scale": "model-00020-of-00189.safetensors",
+ "model.layers.9.post_attention_layernorm.bias": "model-00021-of-00189.safetensors",
+ "model.layers.9.post_attention_layernorm.weight": "model-00021-of-00189.safetensors",
+ "model.layers.9.self_attn.k_proj.weight": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.k_proj.weight_scale": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.o_proj.weight": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.o_proj.weight_scale": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.q_proj.weight": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.q_proj.weight_scale": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.v_proj.weight": "model-00019-of-00189.safetensors",
+ "model.layers.9.self_attn.v_proj.weight_scale": "model-00019-of-00189.safetensors",
+ "model.layers.90.input_layernorm.bias": "model-00183-of-00189.safetensors",
+ "model.layers.90.input_layernorm.weight": "model-00183-of-00189.safetensors",
+ "model.layers.90.mlp.down_proj.weight": "model-00183-of-00189.safetensors",
+ "model.layers.90.mlp.down_proj.weight_scale": "model-00183-of-00189.safetensors",
+ "model.layers.90.mlp.up_proj.weight": "model-00182-of-00189.safetensors",
+ "model.layers.90.mlp.up_proj.weight_scale": "model-00182-of-00189.safetensors",
+ "model.layers.90.post_attention_layernorm.bias": "model-00183-of-00189.safetensors",
+ "model.layers.90.post_attention_layernorm.weight": "model-00183-of-00189.safetensors",
+ "model.layers.90.self_attn.k_proj.weight": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.k_proj.weight_scale": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.o_proj.weight": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.o_proj.weight_scale": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.q_proj.weight": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.q_proj.weight_scale": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.v_proj.weight": "model-00181-of-00189.safetensors",
+ "model.layers.90.self_attn.v_proj.weight_scale": "model-00181-of-00189.safetensors",
+ "model.layers.91.input_layernorm.bias": "model-00185-of-00189.safetensors",
+ "model.layers.91.input_layernorm.weight": "model-00185-of-00189.safetensors",
+ "model.layers.91.mlp.down_proj.weight": "model-00185-of-00189.safetensors",
+ "model.layers.91.mlp.down_proj.weight_scale": "model-00185-of-00189.safetensors",
+ "model.layers.91.mlp.up_proj.weight": "model-00184-of-00189.safetensors",
+ "model.layers.91.mlp.up_proj.weight_scale": "model-00184-of-00189.safetensors",
+ "model.layers.91.post_attention_layernorm.bias": "model-00185-of-00189.safetensors",
+ "model.layers.91.post_attention_layernorm.weight": "model-00185-of-00189.safetensors",
+ "model.layers.91.self_attn.k_proj.weight": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.k_proj.weight_scale": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.o_proj.weight": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.o_proj.weight_scale": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.q_proj.weight": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.q_proj.weight_scale": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.v_proj.weight": "model-00183-of-00189.safetensors",
+ "model.layers.91.self_attn.v_proj.weight_scale": "model-00183-of-00189.safetensors",
+ "model.layers.92.input_layernorm.bias": "model-00187-of-00189.safetensors",
+ "model.layers.92.input_layernorm.weight": "model-00187-of-00189.safetensors",
+ "model.layers.92.mlp.down_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.92.mlp.down_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.92.mlp.up_proj.weight": "model-00186-of-00189.safetensors",
+ "model.layers.92.mlp.up_proj.weight_scale": "model-00186-of-00189.safetensors",
+ "model.layers.92.post_attention_layernorm.bias": "model-00187-of-00189.safetensors",
+ "model.layers.92.post_attention_layernorm.weight": "model-00187-of-00189.safetensors",
+ "model.layers.92.self_attn.k_proj.weight": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.k_proj.weight_scale": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.o_proj.weight": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.o_proj.weight_scale": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.q_proj.weight": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.q_proj.weight_scale": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.v_proj.weight": "model-00185-of-00189.safetensors",
+ "model.layers.92.self_attn.v_proj.weight_scale": "model-00185-of-00189.safetensors",
+ "model.layers.93.input_layernorm.bias": "model-00189-of-00189.safetensors",
+ "model.layers.93.input_layernorm.weight": "model-00189-of-00189.safetensors",
+ "model.layers.93.mlp.down_proj.weight": "model-00189-of-00189.safetensors",
+ "model.layers.93.mlp.down_proj.weight_scale": "model-00189-of-00189.safetensors",
+ "model.layers.93.mlp.up_proj.weight": "model-00189-of-00189.safetensors",
+ "model.layers.93.mlp.up_proj.weight_scale": "model-00189-of-00189.safetensors",
+ "model.layers.93.post_attention_layernorm.bias": "model-00189-of-00189.safetensors",
+ "model.layers.93.post_attention_layernorm.weight": "model-00189-of-00189.safetensors",
+ "model.layers.93.self_attn.k_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.k_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.o_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.o_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.q_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.q_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.v_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.93.self_attn.v_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.94.input_layernorm.bias": "model-00189-of-00189.safetensors",
+ "model.layers.94.input_layernorm.weight": "model-00189-of-00189.safetensors",
+ "model.layers.94.mlp.down_proj.weight": "model-00189-of-00189.safetensors",
+ "model.layers.94.mlp.down_proj.weight_scale": "model-00189-of-00189.safetensors",
+ "model.layers.94.mlp.up_proj.weight": "model-00189-of-00189.safetensors",
+ "model.layers.94.mlp.up_proj.weight_scale": "model-00189-of-00189.safetensors",
+ "model.layers.94.post_attention_layernorm.bias": "model-00189-of-00189.safetensors",
+ "model.layers.94.post_attention_layernorm.weight": "model-00189-of-00189.safetensors",
+ "model.layers.94.self_attn.k_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.k_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.o_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.o_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.q_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.q_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.v_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.94.self_attn.v_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.95.input_layernorm.bias": "model-00189-of-00189.safetensors",
+ "model.layers.95.input_layernorm.weight": "model-00189-of-00189.safetensors",
+ "model.layers.95.mlp.down_proj.weight": "model-00189-of-00189.safetensors",
+ "model.layers.95.mlp.down_proj.weight_scale": "model-00189-of-00189.safetensors",
+ "model.layers.95.mlp.up_proj.weight": "model-00189-of-00189.safetensors",
+ "model.layers.95.mlp.up_proj.weight_scale": "model-00189-of-00189.safetensors",
+ "model.layers.95.post_attention_layernorm.bias": "model-00189-of-00189.safetensors",
+ "model.layers.95.post_attention_layernorm.weight": "model-00189-of-00189.safetensors",
+ "model.layers.95.self_attn.k_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.k_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.o_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.o_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.q_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.q_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.v_proj.weight": "model-00187-of-00189.safetensors",
+ "model.layers.95.self_attn.v_proj.weight_scale": "model-00187-of-00189.safetensors",
+ "model.norm.bias": "model-00189-of-00189.safetensors",
+ "model.norm.weight": "model-00189-of-00189.safetensors"
+ }
+}
\ No newline at end of file
diff --git a/special_tokens_map.json b/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..451134b2ddc2e78555d1e857518c54b4bdc2e87d
--- /dev/null
+++ b/special_tokens_map.json
@@ -0,0 +1,23 @@
+{
+ "bos_token": {
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "eos_token": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "unk_token": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+}
diff --git a/tokenizer.model b/tokenizer.model
new file mode 100644
index 0000000000000000000000000000000000000000..b399c69ef3e792391465e45d07e72ee1fc6acf94
--- /dev/null
+++ b/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6dfd8b970f437002fc445214304969fe59e64d4f48500bd0b77ba55340f2d811
+size 4545602
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..a144cfed4de7d475cc76bf0633884d33b0a86dd7
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,42 @@
+{
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "add_prefix_space": true,
+ "added_tokens_decoder": {
+ "1": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "2": {
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "3": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ }
+ },
+ "bos_token": "<s>",
+ "clean_up_tokenization_spaces": false,
+ "eos_token": "</s>",
+ "legacy": true,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": null,
+ "sp_model_kwargs": {},
+ "spaces_between_special_tokens": false,
+ "tokenizer_class": "LlamaTokenizer",
+ "unk_token": "<unk>",
+ "use_default_system_prompt": false
+}