diff --git a/.gitattributes b/.gitattributes
index d24915691874c1bf94e1d55e820849de88106098..780672f23f4ce7b70bffd3c2e3a54e1cf9c51192 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -36,3 +36,74 @@ tr13-176B-ml-t0-logs/logs/p31lossseq/main_log.txt filter=lfs diff=lfs merge=lfs
 logs/logs/xp3capmixnewcodelonglossseq/main_log.txt filter=lfs diff=lfs merge=lfs -text
 logs/logs/xp3zzlossseq/main_log.txt filter=lfs diff=lfs merge=lfs -text
 logs/logs/p31lossseq/main_log.txt filter=lfs diff=lfs merge=lfs -text
+model_00007-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00035-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00068-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00014-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00060-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00026-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00043-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00041-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00015-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00019-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00013-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00029-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00055-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00056-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00012-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00049-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00027-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00052-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00004-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00037-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00045-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00011-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00067-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00064-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00034-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00005-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00033-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00039-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00042-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00044-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00071-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00053-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00006-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00021-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00036-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00051-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00047-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00024-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00017-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00003-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00023-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00018-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00002-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00016-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00031-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00065-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00022-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00008-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00048-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00063-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00050-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00046-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00009-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00061-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00069-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00070-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00028-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00020-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00025-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00030-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00066-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00032-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00057-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00010-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00058-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00001-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00062-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00038-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00059-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00054-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
+model_00040-of-00072.safetensors filter=lfs diff=lfs merge=lfs -text
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000000000000000000000000000000000000..89e9ab80d83ceb806a7497d5da7071c38ec0405f
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1 @@
+{"metadata": {"total_size": 352494542848}, "weight_map": {"h.0.input_layernorm.bias": "model_00002-of-00072.safetensors", "h.0.input_layernorm.weight": "model_00002-of-00072.safetensors", "h.0.mlp.dense_4h_to_h.bias": "model_00002-of-00072.safetensors", "h.0.mlp.dense_4h_to_h.weight": "model_00002-of-00072.safetensors", "h.0.mlp.dense_h_to_4h.bias": "model_00002-of-00072.safetensors", "h.0.mlp.dense_h_to_4h.weight": "model_00002-of-00072.safetensors", "h.0.post_attention_layernorm.bias": "model_00002-of-00072.safetensors", "h.0.post_attention_layernorm.weight": "model_00002-of-00072.safetensors", "h.0.self_attention.dense.bias": "model_00002-of-00072.safetensors", "h.0.self_attention.dense.weight": "model_00002-of-00072.safetensors", "h.0.self_attention.query_key_value.bias": "model_00002-of-00072.safetensors", "h.0.self_attention.query_key_value.weight": "model_00002-of-00072.safetensors", "h.1.input_layernorm.bias": "model_00003-of-00072.safetensors", "h.1.input_layernorm.weight": "model_00003-of-00072.safetensors", "h.1.mlp.dense_4h_to_h.bias": "model_00003-of-00072.safetensors", "h.1.mlp.dense_4h_to_h.weight": "model_00003-of-00072.safetensors", "h.1.mlp.dense_h_to_4h.bias": "model_00003-of-00072.safetensors", "h.1.mlp.dense_h_to_4h.weight": "model_00003-of-00072.safetensors", "h.1.post_attention_layernorm.bias": "model_00003-of-00072.safetensors", "h.1.post_attention_layernorm.weight": "model_00003-of-00072.safetensors", "h.1.self_attention.dense.bias": "model_00003-of-00072.safetensors", "h.1.self_attention.dense.weight": "model_00003-of-00072.safetensors", "h.1.self_attention.query_key_value.bias": "model_00003-of-00072.safetensors", "h.1.self_attention.query_key_value.weight": "model_00003-of-00072.safetensors", "h.10.input_layernorm.bias": "model_00012-of-00072.safetensors", "h.10.input_layernorm.weight": "model_00012-of-00072.safetensors", "h.10.mlp.dense_4h_to_h.bias": "model_00012-of-00072.safetensors", "h.10.mlp.dense_4h_to_h.weight": "model_00012-of-00072.safetensors", "h.10.mlp.dense_h_to_4h.bias": "model_00012-of-00072.safetensors", "h.10.mlp.dense_h_to_4h.weight": "model_00012-of-00072.safetensors", "h.10.post_attention_layernorm.bias": "model_00012-of-00072.safetensors", "h.10.post_attention_layernorm.weight": "model_00012-of-00072.safetensors", "h.10.self_attention.dense.bias": "model_00012-of-00072.safetensors", "h.10.self_attention.dense.weight": "model_00012-of-00072.safetensors", "h.10.self_attention.query_key_value.bias": "model_00012-of-00072.safetensors", "h.10.self_attention.query_key_value.weight": "model_00012-of-00072.safetensors", "h.11.input_layernorm.bias": "model_00013-of-00072.safetensors", "h.11.input_layernorm.weight": "model_00013-of-00072.safetensors", "h.11.mlp.dense_4h_to_h.bias": "model_00013-of-00072.safetensors", "h.11.mlp.dense_4h_to_h.weight": "model_00013-of-00072.safetensors", "h.11.mlp.dense_h_to_4h.bias": "model_00013-of-00072.safetensors", "h.11.mlp.dense_h_to_4h.weight": "model_00013-of-00072.safetensors", "h.11.post_attention_layernorm.bias": "model_00013-of-00072.safetensors", "h.11.post_attention_layernorm.weight": "model_00013-of-00072.safetensors", "h.11.self_attention.dense.bias": "model_00013-of-00072.safetensors", "h.11.self_attention.dense.weight": "model_00013-of-00072.safetensors", "h.11.self_attention.query_key_value.bias": "model_00013-of-00072.safetensors", "h.11.self_attention.query_key_value.weight": "model_00013-of-00072.safetensors", "h.12.input_layernorm.bias": "model_00014-of-00072.safetensors", "h.12.input_layernorm.weight": "model_00014-of-00072.safetensors", "h.12.mlp.dense_4h_to_h.bias": "model_00014-of-00072.safetensors", "h.12.mlp.dense_4h_to_h.weight": "model_00014-of-00072.safetensors", "h.12.mlp.dense_h_to_4h.bias": "model_00014-of-00072.safetensors", "h.12.mlp.dense_h_to_4h.weight": "model_00014-of-00072.safetensors", "h.12.post_attention_layernorm.bias": "model_00014-of-00072.safetensors", "h.12.post_attention_layernorm.weight": "model_00014-of-00072.safetensors", "h.12.self_attention.dense.bias": "model_00014-of-00072.safetensors", "h.12.self_attention.dense.weight": "model_00014-of-00072.safetensors", "h.12.self_attention.query_key_value.bias": "model_00014-of-00072.safetensors", "h.12.self_attention.query_key_value.weight": "model_00014-of-00072.safetensors", "h.13.input_layernorm.bias": "model_00015-of-00072.safetensors", "h.13.input_layernorm.weight": "model_00015-of-00072.safetensors", "h.13.mlp.dense_4h_to_h.bias": "model_00015-of-00072.safetensors", "h.13.mlp.dense_4h_to_h.weight": "model_00015-of-00072.safetensors", "h.13.mlp.dense_h_to_4h.bias": "model_00015-of-00072.safetensors", "h.13.mlp.dense_h_to_4h.weight": "model_00015-of-00072.safetensors", "h.13.post_attention_layernorm.bias": "model_00015-of-00072.safetensors", "h.13.post_attention_layernorm.weight": "model_00015-of-00072.safetensors", "h.13.self_attention.dense.bias": "model_00015-of-00072.safetensors", "h.13.self_attention.dense.weight": "model_00015-of-00072.safetensors", "h.13.self_attention.query_key_value.bias": "model_00015-of-00072.safetensors", "h.13.self_attention.query_key_value.weight": "model_00015-of-00072.safetensors", "h.14.input_layernorm.bias": "model_00016-of-00072.safetensors", "h.14.input_layernorm.weight": "model_00016-of-00072.safetensors", "h.14.mlp.dense_4h_to_h.bias": "model_00016-of-00072.safetensors", "h.14.mlp.dense_4h_to_h.weight": "model_00016-of-00072.safetensors", "h.14.mlp.dense_h_to_4h.bias": "model_00016-of-00072.safetensors", "h.14.mlp.dense_h_to_4h.weight": "model_00016-of-00072.safetensors", "h.14.post_attention_layernorm.bias": "model_00016-of-00072.safetensors", "h.14.post_attention_layernorm.weight": "model_00016-of-00072.safetensors", "h.14.self_attention.dense.bias": "model_00016-of-00072.safetensors", "h.14.self_attention.dense.weight": "model_00016-of-00072.safetensors", "h.14.self_attention.query_key_value.bias": "model_00016-of-00072.safetensors", "h.14.self_attention.query_key_value.weight": "model_00016-of-00072.safetensors", "h.15.input_layernorm.bias": "model_00017-of-00072.safetensors", "h.15.input_layernorm.weight": "model_00017-of-00072.safetensors", "h.15.mlp.dense_4h_to_h.bias": "model_00017-of-00072.safetensors", "h.15.mlp.dense_4h_to_h.weight": "model_00017-of-00072.safetensors", "h.15.mlp.dense_h_to_4h.bias": "model_00017-of-00072.safetensors", "h.15.mlp.dense_h_to_4h.weight": "model_00017-of-00072.safetensors", "h.15.post_attention_layernorm.bias": "model_00017-of-00072.safetensors", "h.15.post_attention_layernorm.weight": "model_00017-of-00072.safetensors", "h.15.self_attention.dense.bias": "model_00017-of-00072.safetensors", "h.15.self_attention.dense.weight": "model_00017-of-00072.safetensors", "h.15.self_attention.query_key_value.bias": "model_00017-of-00072.safetensors", "h.15.self_attention.query_key_value.weight": "model_00017-of-00072.safetensors", "h.16.input_layernorm.bias": "model_00018-of-00072.safetensors", "h.16.input_layernorm.weight": "model_00018-of-00072.safetensors", "h.16.mlp.dense_4h_to_h.bias": "model_00018-of-00072.safetensors", "h.16.mlp.dense_4h_to_h.weight": "model_00018-of-00072.safetensors", "h.16.mlp.dense_h_to_4h.bias": "model_00018-of-00072.safetensors", "h.16.mlp.dense_h_to_4h.weight": "model_00018-of-00072.safetensors", "h.16.post_attention_layernorm.bias": "model_00018-of-00072.safetensors", "h.16.post_attention_layernorm.weight": "model_00018-of-00072.safetensors", "h.16.self_attention.dense.bias": "model_00018-of-00072.safetensors", "h.16.self_attention.dense.weight": "model_00018-of-00072.safetensors", "h.16.self_attention.query_key_value.bias": "model_00018-of-00072.safetensors", "h.16.self_attention.query_key_value.weight": "model_00018-of-00072.safetensors", "h.17.input_layernorm.bias": "model_00019-of-00072.safetensors", "h.17.input_layernorm.weight": "model_00019-of-00072.safetensors", "h.17.mlp.dense_4h_to_h.bias": "model_00019-of-00072.safetensors", "h.17.mlp.dense_4h_to_h.weight": "model_00019-of-00072.safetensors", "h.17.mlp.dense_h_to_4h.bias": "model_00019-of-00072.safetensors", "h.17.mlp.dense_h_to_4h.weight": "model_00019-of-00072.safetensors", "h.17.post_attention_layernorm.bias": "model_00019-of-00072.safetensors", "h.17.post_attention_layernorm.weight": "model_00019-of-00072.safetensors", "h.17.self_attention.dense.bias": "model_00019-of-00072.safetensors", "h.17.self_attention.dense.weight": "model_00019-of-00072.safetensors", "h.17.self_attention.query_key_value.bias": "model_00019-of-00072.safetensors", "h.17.self_attention.query_key_value.weight": "model_00019-of-00072.safetensors", "h.18.input_layernorm.bias": "model_00020-of-00072.safetensors", "h.18.input_layernorm.weight": "model_00020-of-00072.safetensors", "h.18.mlp.dense_4h_to_h.bias": "model_00020-of-00072.safetensors", "h.18.mlp.dense_4h_to_h.weight": "model_00020-of-00072.safetensors", "h.18.mlp.dense_h_to_4h.bias": "model_00020-of-00072.safetensors", "h.18.mlp.dense_h_to_4h.weight": "model_00020-of-00072.safetensors", "h.18.post_attention_layernorm.bias": "model_00020-of-00072.safetensors", "h.18.post_attention_layernorm.weight": "model_00020-of-00072.safetensors", "h.18.self_attention.dense.bias": "model_00020-of-00072.safetensors", "h.18.self_attention.dense.weight": "model_00020-of-00072.safetensors", "h.18.self_attention.query_key_value.bias": "model_00020-of-00072.safetensors", "h.18.self_attention.query_key_value.weight": "model_00020-of-00072.safetensors", "h.19.input_layernorm.bias": "model_00021-of-00072.safetensors", "h.19.input_layernorm.weight": "model_00021-of-00072.safetensors", "h.19.mlp.dense_4h_to_h.bias": "model_00021-of-00072.safetensors", "h.19.mlp.dense_4h_to_h.weight": "model_00021-of-00072.safetensors", "h.19.mlp.dense_h_to_4h.bias": "model_00021-of-00072.safetensors", "h.19.mlp.dense_h_to_4h.weight": "model_00021-of-00072.safetensors", "h.19.post_attention_layernorm.bias": "model_00021-of-00072.safetensors", "h.19.post_attention_layernorm.weight": "model_00021-of-00072.safetensors", "h.19.self_attention.dense.bias": "model_00021-of-00072.safetensors", "h.19.self_attention.dense.weight": "model_00021-of-00072.safetensors", "h.19.self_attention.query_key_value.bias": "model_00021-of-00072.safetensors", "h.19.self_attention.query_key_value.weight": "model_00021-of-00072.safetensors", "h.2.input_layernorm.bias": "model_00004-of-00072.safetensors", "h.2.input_layernorm.weight": "model_00004-of-00072.safetensors", "h.2.mlp.dense_4h_to_h.bias": "model_00004-of-00072.safetensors", "h.2.mlp.dense_4h_to_h.weight": "model_00004-of-00072.safetensors", "h.2.mlp.dense_h_to_4h.bias": "model_00004-of-00072.safetensors", "h.2.mlp.dense_h_to_4h.weight": "model_00004-of-00072.safetensors", "h.2.post_attention_layernorm.bias": "model_00004-of-00072.safetensors", "h.2.post_attention_layernorm.weight": "model_00004-of-00072.safetensors", "h.2.self_attention.dense.bias": "model_00004-of-00072.safetensors", "h.2.self_attention.dense.weight": "model_00004-of-00072.safetensors", "h.2.self_attention.query_key_value.bias": "model_00004-of-00072.safetensors", "h.2.self_attention.query_key_value.weight": "model_00004-of-00072.safetensors", "h.20.input_layernorm.bias": "model_00022-of-00072.safetensors", "h.20.input_layernorm.weight": "model_00022-of-00072.safetensors", "h.20.mlp.dense_4h_to_h.bias": "model_00022-of-00072.safetensors", "h.20.mlp.dense_4h_to_h.weight": "model_00022-of-00072.safetensors", "h.20.mlp.dense_h_to_4h.bias": "model_00022-of-00072.safetensors", "h.20.mlp.dense_h_to_4h.weight": "model_00022-of-00072.safetensors", "h.20.post_attention_layernorm.bias": "model_00022-of-00072.safetensors", "h.20.post_attention_layernorm.weight": "model_00022-of-00072.safetensors", "h.20.self_attention.dense.bias": "model_00022-of-00072.safetensors", "h.20.self_attention.dense.weight": "model_00022-of-00072.safetensors", "h.20.self_attention.query_key_value.bias": "model_00022-of-00072.safetensors", "h.20.self_attention.query_key_value.weight": "model_00022-of-00072.safetensors", "h.21.input_layernorm.bias": "model_00023-of-00072.safetensors", "h.21.input_layernorm.weight": "model_00023-of-00072.safetensors", "h.21.mlp.dense_4h_to_h.bias": "model_00023-of-00072.safetensors", "h.21.mlp.dense_4h_to_h.weight": "model_00023-of-00072.safetensors", "h.21.mlp.dense_h_to_4h.bias": "model_00023-of-00072.safetensors", "h.21.mlp.dense_h_to_4h.weight": "model_00023-of-00072.safetensors", "h.21.post_attention_layernorm.bias": "model_00023-of-00072.safetensors", "h.21.post_attention_layernorm.weight": "model_00023-of-00072.safetensors", "h.21.self_attention.dense.bias": "model_00023-of-00072.safetensors", "h.21.self_attention.dense.weight": "model_00023-of-00072.safetensors", "h.21.self_attention.query_key_value.bias": "model_00023-of-00072.safetensors", "h.21.self_attention.query_key_value.weight": "model_00023-of-00072.safetensors", "h.22.input_layernorm.bias": "model_00024-of-00072.safetensors", "h.22.input_layernorm.weight": "model_00024-of-00072.safetensors", "h.22.mlp.dense_4h_to_h.bias": "model_00024-of-00072.safetensors", "h.22.mlp.dense_4h_to_h.weight": "model_00024-of-00072.safetensors", "h.22.mlp.dense_h_to_4h.bias": "model_00024-of-00072.safetensors", "h.22.mlp.dense_h_to_4h.weight": "model_00024-of-00072.safetensors", "h.22.post_attention_layernorm.bias": "model_00024-of-00072.safetensors", "h.22.post_attention_layernorm.weight": "model_00024-of-00072.safetensors", "h.22.self_attention.dense.bias": "model_00024-of-00072.safetensors", "h.22.self_attention.dense.weight": "model_00024-of-00072.safetensors", "h.22.self_attention.query_key_value.bias": "model_00024-of-00072.safetensors", "h.22.self_attention.query_key_value.weight": "model_00024-of-00072.safetensors", "h.23.input_layernorm.bias": "model_00025-of-00072.safetensors", "h.23.input_layernorm.weight": "model_00025-of-00072.safetensors", "h.23.mlp.dense_4h_to_h.bias": "model_00025-of-00072.safetensors", "h.23.mlp.dense_4h_to_h.weight": "model_00025-of-00072.safetensors", "h.23.mlp.dense_h_to_4h.bias": "model_00025-of-00072.safetensors", "h.23.mlp.dense_h_to_4h.weight": "model_00025-of-00072.safetensors", "h.23.post_attention_layernorm.bias": "model_00025-of-00072.safetensors", "h.23.post_attention_layernorm.weight": "model_00025-of-00072.safetensors", "h.23.self_attention.dense.bias": "model_00025-of-00072.safetensors", "h.23.self_attention.dense.weight": "model_00025-of-00072.safetensors", "h.23.self_attention.query_key_value.bias": "model_00025-of-00072.safetensors", "h.23.self_attention.query_key_value.weight": "model_00025-of-00072.safetensors", "h.24.input_layernorm.bias": "model_00026-of-00072.safetensors", "h.24.input_layernorm.weight": "model_00026-of-00072.safetensors", "h.24.mlp.dense_4h_to_h.bias": "model_00026-of-00072.safetensors", "h.24.mlp.dense_4h_to_h.weight": "model_00026-of-00072.safetensors", "h.24.mlp.dense_h_to_4h.bias": "model_00026-of-00072.safetensors", "h.24.mlp.dense_h_to_4h.weight": "model_00026-of-00072.safetensors", "h.24.post_attention_layernorm.bias": "model_00026-of-00072.safetensors", "h.24.post_attention_layernorm.weight": "model_00026-of-00072.safetensors", "h.24.self_attention.dense.bias": "model_00026-of-00072.safetensors", "h.24.self_attention.dense.weight": "model_00026-of-00072.safetensors", "h.24.self_attention.query_key_value.bias": "model_00026-of-00072.safetensors", "h.24.self_attention.query_key_value.weight": "model_00026-of-00072.safetensors", "h.25.input_layernorm.bias": "model_00027-of-00072.safetensors", "h.25.input_layernorm.weight": "model_00027-of-00072.safetensors", "h.25.mlp.dense_4h_to_h.bias": "model_00027-of-00072.safetensors", "h.25.mlp.dense_4h_to_h.weight": "model_00027-of-00072.safetensors", "h.25.mlp.dense_h_to_4h.bias": "model_00027-of-00072.safetensors", "h.25.mlp.dense_h_to_4h.weight": "model_00027-of-00072.safetensors", "h.25.post_attention_layernorm.bias": "model_00027-of-00072.safetensors", "h.25.post_attention_layernorm.weight": "model_00027-of-00072.safetensors", "h.25.self_attention.dense.bias": "model_00027-of-00072.safetensors", "h.25.self_attention.dense.weight": "model_00027-of-00072.safetensors", "h.25.self_attention.query_key_value.bias": "model_00027-of-00072.safetensors", "h.25.self_attention.query_key_value.weight": "model_00027-of-00072.safetensors", "h.26.input_layernorm.bias": "model_00028-of-00072.safetensors", "h.26.input_layernorm.weight": "model_00028-of-00072.safetensors", "h.26.mlp.dense_4h_to_h.bias": "model_00028-of-00072.safetensors", "h.26.mlp.dense_4h_to_h.weight": "model_00028-of-00072.safetensors", "h.26.mlp.dense_h_to_4h.bias": "model_00028-of-00072.safetensors", "h.26.mlp.dense_h_to_4h.weight": "model_00028-of-00072.safetensors", "h.26.post_attention_layernorm.bias": "model_00028-of-00072.safetensors", "h.26.post_attention_layernorm.weight": "model_00028-of-00072.safetensors", "h.26.self_attention.dense.bias": "model_00028-of-00072.safetensors", "h.26.self_attention.dense.weight": "model_00028-of-00072.safetensors", "h.26.self_attention.query_key_value.bias": "model_00028-of-00072.safetensors", "h.26.self_attention.query_key_value.weight": "model_00028-of-00072.safetensors", "h.27.input_layernorm.bias": "model_00029-of-00072.safetensors", "h.27.input_layernorm.weight": "model_00029-of-00072.safetensors", "h.27.mlp.dense_4h_to_h.bias": "model_00029-of-00072.safetensors", "h.27.mlp.dense_4h_to_h.weight": "model_00029-of-00072.safetensors", "h.27.mlp.dense_h_to_4h.bias": "model_00029-of-00072.safetensors", "h.27.mlp.dense_h_to_4h.weight": "model_00029-of-00072.safetensors", "h.27.post_attention_layernorm.bias": "model_00029-of-00072.safetensors", "h.27.post_attention_layernorm.weight": "model_00029-of-00072.safetensors", "h.27.self_attention.dense.bias": "model_00029-of-00072.safetensors", "h.27.self_attention.dense.weight": "model_00029-of-00072.safetensors", "h.27.self_attention.query_key_value.bias": "model_00029-of-00072.safetensors", "h.27.self_attention.query_key_value.weight": "model_00029-of-00072.safetensors", "h.28.input_layernorm.bias": "model_00030-of-00072.safetensors", "h.28.input_layernorm.weight": "model_00030-of-00072.safetensors", "h.28.mlp.dense_4h_to_h.bias": "model_00030-of-00072.safetensors", "h.28.mlp.dense_4h_to_h.weight": "model_00030-of-00072.safetensors", "h.28.mlp.dense_h_to_4h.bias": "model_00030-of-00072.safetensors", "h.28.mlp.dense_h_to_4h.weight": "model_00030-of-00072.safetensors", "h.28.post_attention_layernorm.bias": "model_00030-of-00072.safetensors", "h.28.post_attention_layernorm.weight": "model_00030-of-00072.safetensors", "h.28.self_attention.dense.bias": "model_00030-of-00072.safetensors", "h.28.self_attention.dense.weight": "model_00030-of-00072.safetensors", "h.28.self_attention.query_key_value.bias": "model_00030-of-00072.safetensors", "h.28.self_attention.query_key_value.weight": "model_00030-of-00072.safetensors", "h.29.input_layernorm.bias": "model_00031-of-00072.safetensors", "h.29.input_layernorm.weight": "model_00031-of-00072.safetensors", "h.29.mlp.dense_4h_to_h.bias": "model_00031-of-00072.safetensors", "h.29.mlp.dense_4h_to_h.weight": "model_00031-of-00072.safetensors", "h.29.mlp.dense_h_to_4h.bias": "model_00031-of-00072.safetensors", "h.29.mlp.dense_h_to_4h.weight": "model_00031-of-00072.safetensors", "h.29.post_attention_layernorm.bias": "model_00031-of-00072.safetensors", "h.29.post_attention_layernorm.weight": "model_00031-of-00072.safetensors", "h.29.self_attention.dense.bias": "model_00031-of-00072.safetensors", "h.29.self_attention.dense.weight": "model_00031-of-00072.safetensors", "h.29.self_attention.query_key_value.bias": "model_00031-of-00072.safetensors", "h.29.self_attention.query_key_value.weight": "model_00031-of-00072.safetensors", "h.3.input_layernorm.bias": "model_00005-of-00072.safetensors", "h.3.input_layernorm.weight": "model_00005-of-00072.safetensors", "h.3.mlp.dense_4h_to_h.bias": "model_00005-of-00072.safetensors", "h.3.mlp.dense_4h_to_h.weight": "model_00005-of-00072.safetensors", "h.3.mlp.dense_h_to_4h.bias": "model_00005-of-00072.safetensors", "h.3.mlp.dense_h_to_4h.weight": "model_00005-of-00072.safetensors", "h.3.post_attention_layernorm.bias": "model_00005-of-00072.safetensors", "h.3.post_attention_layernorm.weight": "model_00005-of-00072.safetensors", "h.3.self_attention.dense.bias": "model_00005-of-00072.safetensors", "h.3.self_attention.dense.weight": "model_00005-of-00072.safetensors", "h.3.self_attention.query_key_value.bias": "model_00005-of-00072.safetensors", "h.3.self_attention.query_key_value.weight": "model_00005-of-00072.safetensors", "h.30.input_layernorm.bias": "model_00032-of-00072.safetensors", "h.30.input_layernorm.weight": "model_00032-of-00072.safetensors", "h.30.mlp.dense_4h_to_h.bias": "model_00032-of-00072.safetensors", "h.30.mlp.dense_4h_to_h.weight": "model_00032-of-00072.safetensors", "h.30.mlp.dense_h_to_4h.bias": "model_00032-of-00072.safetensors", "h.30.mlp.dense_h_to_4h.weight": "model_00032-of-00072.safetensors", "h.30.post_attention_layernorm.bias": "model_00032-of-00072.safetensors", "h.30.post_attention_layernorm.weight": "model_00032-of-00072.safetensors", "h.30.self_attention.dense.bias": "model_00032-of-00072.safetensors", "h.30.self_attention.dense.weight": "model_00032-of-00072.safetensors", "h.30.self_attention.query_key_value.bias": "model_00032-of-00072.safetensors", "h.30.self_attention.query_key_value.weight": "model_00032-of-00072.safetensors", "h.31.input_layernorm.bias": "model_00033-of-00072.safetensors", "h.31.input_layernorm.weight": "model_00033-of-00072.safetensors", "h.31.mlp.dense_4h_to_h.bias": "model_00033-of-00072.safetensors", "h.31.mlp.dense_4h_to_h.weight": "model_00033-of-00072.safetensors", "h.31.mlp.dense_h_to_4h.bias": "model_00033-of-00072.safetensors", "h.31.mlp.dense_h_to_4h.weight": "model_00033-of-00072.safetensors", "h.31.post_attention_layernorm.bias": "model_00033-of-00072.safetensors", "h.31.post_attention_layernorm.weight": "model_00033-of-00072.safetensors", "h.31.self_attention.dense.bias": "model_00033-of-00072.safetensors", "h.31.self_attention.dense.weight": "model_00033-of-00072.safetensors", "h.31.self_attention.query_key_value.bias": "model_00033-of-00072.safetensors", "h.31.self_attention.query_key_value.weight": "model_00033-of-00072.safetensors", "h.32.input_layernorm.bias": "model_00034-of-00072.safetensors", "h.32.input_layernorm.weight": "model_00034-of-00072.safetensors", "h.32.mlp.dense_4h_to_h.bias": "model_00034-of-00072.safetensors", "h.32.mlp.dense_4h_to_h.weight": "model_00034-of-00072.safetensors", "h.32.mlp.dense_h_to_4h.bias": "model_00034-of-00072.safetensors", "h.32.mlp.dense_h_to_4h.weight": "model_00034-of-00072.safetensors", "h.32.post_attention_layernorm.bias": "model_00034-of-00072.safetensors", "h.32.post_attention_layernorm.weight": "model_00034-of-00072.safetensors", "h.32.self_attention.dense.bias": "model_00034-of-00072.safetensors", "h.32.self_attention.dense.weight": "model_00034-of-00072.safetensors", "h.32.self_attention.query_key_value.bias": "model_00034-of-00072.safetensors", "h.32.self_attention.query_key_value.weight": "model_00034-of-00072.safetensors", "h.33.input_layernorm.bias": "model_00035-of-00072.safetensors", "h.33.input_layernorm.weight": "model_00035-of-00072.safetensors", "h.33.mlp.dense_4h_to_h.bias": "model_00035-of-00072.safetensors", "h.33.mlp.dense_4h_to_h.weight": "model_00035-of-00072.safetensors", "h.33.mlp.dense_h_to_4h.bias": "model_00035-of-00072.safetensors", "h.33.mlp.dense_h_to_4h.weight": "model_00035-of-00072.safetensors", "h.33.post_attention_layernorm.bias": "model_00035-of-00072.safetensors", "h.33.post_attention_layernorm.weight": "model_00035-of-00072.safetensors", "h.33.self_attention.dense.bias": "model_00035-of-00072.safetensors", "h.33.self_attention.dense.weight": "model_00035-of-00072.safetensors", "h.33.self_attention.query_key_value.bias": "model_00035-of-00072.safetensors", "h.33.self_attention.query_key_value.weight": "model_00035-of-00072.safetensors", "h.34.input_layernorm.bias": "model_00036-of-00072.safetensors", "h.34.input_layernorm.weight": "model_00036-of-00072.safetensors", "h.34.mlp.dense_4h_to_h.bias": "model_00036-of-00072.safetensors", "h.34.mlp.dense_4h_to_h.weight": "model_00036-of-00072.safetensors", "h.34.mlp.dense_h_to_4h.bias": "model_00036-of-00072.safetensors", "h.34.mlp.dense_h_to_4h.weight": "model_00036-of-00072.safetensors", "h.34.post_attention_layernorm.bias": "model_00036-of-00072.safetensors", "h.34.post_attention_layernorm.weight": "model_00036-of-00072.safetensors", "h.34.self_attention.dense.bias": "model_00036-of-00072.safetensors", "h.34.self_attention.dense.weight": "model_00036-of-00072.safetensors", "h.34.self_attention.query_key_value.bias": "model_00036-of-00072.safetensors", "h.34.self_attention.query_key_value.weight": "model_00036-of-00072.safetensors", "h.35.input_layernorm.bias": "model_00037-of-00072.safetensors", "h.35.input_layernorm.weight": "model_00037-of-00072.safetensors", "h.35.mlp.dense_4h_to_h.bias": "model_00037-of-00072.safetensors", "h.35.mlp.dense_4h_to_h.weight": "model_00037-of-00072.safetensors", "h.35.mlp.dense_h_to_4h.bias": "model_00037-of-00072.safetensors", "h.35.mlp.dense_h_to_4h.weight": "model_00037-of-00072.safetensors", "h.35.post_attention_layernorm.bias": "model_00037-of-00072.safetensors", "h.35.post_attention_layernorm.weight": "model_00037-of-00072.safetensors", "h.35.self_attention.dense.bias": "model_00037-of-00072.safetensors", "h.35.self_attention.dense.weight": "model_00037-of-00072.safetensors", "h.35.self_attention.query_key_value.bias": "model_00037-of-00072.safetensors", "h.35.self_attention.query_key_value.weight": "model_00037-of-00072.safetensors", "h.36.input_layernorm.bias": "model_00038-of-00072.safetensors", "h.36.input_layernorm.weight": "model_00038-of-00072.safetensors", "h.36.mlp.dense_4h_to_h.bias": "model_00038-of-00072.safetensors", "h.36.mlp.dense_4h_to_h.weight": "model_00038-of-00072.safetensors", "h.36.mlp.dense_h_to_4h.bias": "model_00038-of-00072.safetensors", "h.36.mlp.dense_h_to_4h.weight": "model_00038-of-00072.safetensors", "h.36.post_attention_layernorm.bias": "model_00038-of-00072.safetensors", "h.36.post_attention_layernorm.weight": "model_00038-of-00072.safetensors", "h.36.self_attention.dense.bias": "model_00038-of-00072.safetensors", "h.36.self_attention.dense.weight": "model_00038-of-00072.safetensors", "h.36.self_attention.query_key_value.bias": "model_00038-of-00072.safetensors", "h.36.self_attention.query_key_value.weight": "model_00038-of-00072.safetensors", "h.37.input_layernorm.bias": "model_00039-of-00072.safetensors", "h.37.input_layernorm.weight": "model_00039-of-00072.safetensors", "h.37.mlp.dense_4h_to_h.bias": "model_00039-of-00072.safetensors", "h.37.mlp.dense_4h_to_h.weight": "model_00039-of-00072.safetensors", "h.37.mlp.dense_h_to_4h.bias": "model_00039-of-00072.safetensors", "h.37.mlp.dense_h_to_4h.weight": "model_00039-of-00072.safetensors", "h.37.post_attention_layernorm.bias": "model_00039-of-00072.safetensors", "h.37.post_attention_layernorm.weight": "model_00039-of-00072.safetensors", "h.37.self_attention.dense.bias": "model_00039-of-00072.safetensors", "h.37.self_attention.dense.weight": "model_00039-of-00072.safetensors", "h.37.self_attention.query_key_value.bias": "model_00039-of-00072.safetensors", "h.37.self_attention.query_key_value.weight": "model_00039-of-00072.safetensors", "h.38.input_layernorm.bias": "model_00040-of-00072.safetensors", "h.38.input_layernorm.weight": "model_00040-of-00072.safetensors", "h.38.mlp.dense_4h_to_h.bias": "model_00040-of-00072.safetensors", "h.38.mlp.dense_4h_to_h.weight": "model_00040-of-00072.safetensors", "h.38.mlp.dense_h_to_4h.bias": "model_00040-of-00072.safetensors", "h.38.mlp.dense_h_to_4h.weight": "model_00040-of-00072.safetensors", "h.38.post_attention_layernorm.bias": "model_00040-of-00072.safetensors", "h.38.post_attention_layernorm.weight": "model_00040-of-00072.safetensors", "h.38.self_attention.dense.bias": "model_00040-of-00072.safetensors", "h.38.self_attention.dense.weight": "model_00040-of-00072.safetensors", "h.38.self_attention.query_key_value.bias": "model_00040-of-00072.safetensors", "h.38.self_attention.query_key_value.weight": "model_00040-of-00072.safetensors", "h.39.input_layernorm.bias": "model_00041-of-00072.safetensors", "h.39.input_layernorm.weight": "model_00041-of-00072.safetensors", "h.39.mlp.dense_4h_to_h.bias": "model_00041-of-00072.safetensors", "h.39.mlp.dense_4h_to_h.weight": "model_00041-of-00072.safetensors", "h.39.mlp.dense_h_to_4h.bias": "model_00041-of-00072.safetensors", "h.39.mlp.dense_h_to_4h.weight": "model_00041-of-00072.safetensors", "h.39.post_attention_layernorm.bias": "model_00041-of-00072.safetensors", "h.39.post_attention_layernorm.weight": "model_00041-of-00072.safetensors", "h.39.self_attention.dense.bias": "model_00041-of-00072.safetensors", "h.39.self_attention.dense.weight": "model_00041-of-00072.safetensors", "h.39.self_attention.query_key_value.bias": "model_00041-of-00072.safetensors", "h.39.self_attention.query_key_value.weight": "model_00041-of-00072.safetensors", "h.4.input_layernorm.bias": "model_00006-of-00072.safetensors", "h.4.input_layernorm.weight": "model_00006-of-00072.safetensors", "h.4.mlp.dense_4h_to_h.bias": "model_00006-of-00072.safetensors", "h.4.mlp.dense_4h_to_h.weight": "model_00006-of-00072.safetensors", "h.4.mlp.dense_h_to_4h.bias": "model_00006-of-00072.safetensors", "h.4.mlp.dense_h_to_4h.weight": "model_00006-of-00072.safetensors", "h.4.post_attention_layernorm.bias": "model_00006-of-00072.safetensors", "h.4.post_attention_layernorm.weight": "model_00006-of-00072.safetensors", "h.4.self_attention.dense.bias": "model_00006-of-00072.safetensors", "h.4.self_attention.dense.weight": "model_00006-of-00072.safetensors", "h.4.self_attention.query_key_value.bias": "model_00006-of-00072.safetensors", "h.4.self_attention.query_key_value.weight": "model_00006-of-00072.safetensors", "h.40.input_layernorm.bias": "model_00042-of-00072.safetensors", "h.40.input_layernorm.weight": "model_00042-of-00072.safetensors", "h.40.mlp.dense_4h_to_h.bias": "model_00042-of-00072.safetensors", "h.40.mlp.dense_4h_to_h.weight": "model_00042-of-00072.safetensors", "h.40.mlp.dense_h_to_4h.bias": "model_00042-of-00072.safetensors", "h.40.mlp.dense_h_to_4h.weight": "model_00042-of-00072.safetensors", "h.40.post_attention_layernorm.bias": "model_00042-of-00072.safetensors", "h.40.post_attention_layernorm.weight": "model_00042-of-00072.safetensors", "h.40.self_attention.dense.bias": "model_00042-of-00072.safetensors", "h.40.self_attention.dense.weight": "model_00042-of-00072.safetensors", "h.40.self_attention.query_key_value.bias": "model_00042-of-00072.safetensors", "h.40.self_attention.query_key_value.weight": "model_00042-of-00072.safetensors", "h.41.input_layernorm.bias": "model_00043-of-00072.safetensors", "h.41.input_layernorm.weight": "model_00043-of-00072.safetensors", "h.41.mlp.dense_4h_to_h.bias": "model_00043-of-00072.safetensors", "h.41.mlp.dense_4h_to_h.weight": "model_00043-of-00072.safetensors", "h.41.mlp.dense_h_to_4h.bias": "model_00043-of-00072.safetensors", "h.41.mlp.dense_h_to_4h.weight": "model_00043-of-00072.safetensors", "h.41.post_attention_layernorm.bias": "model_00043-of-00072.safetensors", "h.41.post_attention_layernorm.weight": "model_00043-of-00072.safetensors", "h.41.self_attention.dense.bias": "model_00043-of-00072.safetensors", "h.41.self_attention.dense.weight": "model_00043-of-00072.safetensors", "h.41.self_attention.query_key_value.bias": "model_00043-of-00072.safetensors", "h.41.self_attention.query_key_value.weight": "model_00043-of-00072.safetensors", "h.42.input_layernorm.bias": "model_00044-of-00072.safetensors", "h.42.input_layernorm.weight": "model_00044-of-00072.safetensors", "h.42.mlp.dense_4h_to_h.bias": "model_00044-of-00072.safetensors", "h.42.mlp.dense_4h_to_h.weight": "model_00044-of-00072.safetensors", "h.42.mlp.dense_h_to_4h.bias": "model_00044-of-00072.safetensors", "h.42.mlp.dense_h_to_4h.weight": "model_00044-of-00072.safetensors", "h.42.post_attention_layernorm.bias": "model_00044-of-00072.safetensors", "h.42.post_attention_layernorm.weight": "model_00044-of-00072.safetensors", "h.42.self_attention.dense.bias": "model_00044-of-00072.safetensors", "h.42.self_attention.dense.weight": "model_00044-of-00072.safetensors", "h.42.self_attention.query_key_value.bias": "model_00044-of-00072.safetensors", "h.42.self_attention.query_key_value.weight": "model_00044-of-00072.safetensors", "h.43.input_layernorm.bias": "model_00045-of-00072.safetensors", "h.43.input_layernorm.weight": "model_00045-of-00072.safetensors", "h.43.mlp.dense_4h_to_h.bias": "model_00045-of-00072.safetensors", "h.43.mlp.dense_4h_to_h.weight": "model_00045-of-00072.safetensors", "h.43.mlp.dense_h_to_4h.bias": "model_00045-of-00072.safetensors", "h.43.mlp.dense_h_to_4h.weight": "model_00045-of-00072.safetensors", "h.43.post_attention_layernorm.bias": "model_00045-of-00072.safetensors", "h.43.post_attention_layernorm.weight": "model_00045-of-00072.safetensors", "h.43.self_attention.dense.bias": "model_00045-of-00072.safetensors", "h.43.self_attention.dense.weight": "model_00045-of-00072.safetensors", "h.43.self_attention.query_key_value.bias": "model_00045-of-00072.safetensors", "h.43.self_attention.query_key_value.weight": "model_00045-of-00072.safetensors", "h.44.input_layernorm.bias": "model_00046-of-00072.safetensors", "h.44.input_layernorm.weight": "model_00046-of-00072.safetensors", "h.44.mlp.dense_4h_to_h.bias": "model_00046-of-00072.safetensors", "h.44.mlp.dense_4h_to_h.weight": "model_00046-of-00072.safetensors", "h.44.mlp.dense_h_to_4h.bias": "model_00046-of-00072.safetensors", "h.44.mlp.dense_h_to_4h.weight": "model_00046-of-00072.safetensors", "h.44.post_attention_layernorm.bias": "model_00046-of-00072.safetensors", "h.44.post_attention_layernorm.weight": "model_00046-of-00072.safetensors", "h.44.self_attention.dense.bias": "model_00046-of-00072.safetensors", "h.44.self_attention.dense.weight": "model_00046-of-00072.safetensors", "h.44.self_attention.query_key_value.bias": "model_00046-of-00072.safetensors", "h.44.self_attention.query_key_value.weight": "model_00046-of-00072.safetensors", "h.45.input_layernorm.bias": "model_00047-of-00072.safetensors", "h.45.input_layernorm.weight": "model_00047-of-00072.safetensors", "h.45.mlp.dense_4h_to_h.bias": "model_00047-of-00072.safetensors", "h.45.mlp.dense_4h_to_h.weight": "model_00047-of-00072.safetensors", "h.45.mlp.dense_h_to_4h.bias": "model_00047-of-00072.safetensors", "h.45.mlp.dense_h_to_4h.weight": "model_00047-of-00072.safetensors", "h.45.post_attention_layernorm.bias": "model_00047-of-00072.safetensors", "h.45.post_attention_layernorm.weight": "model_00047-of-00072.safetensors", "h.45.self_attention.dense.bias": "model_00047-of-00072.safetensors", "h.45.self_attention.dense.weight": "model_00047-of-00072.safetensors", "h.45.self_attention.query_key_value.bias": "model_00047-of-00072.safetensors", "h.45.self_attention.query_key_value.weight": "model_00047-of-00072.safetensors", "h.46.input_layernorm.bias": "model_00048-of-00072.safetensors", "h.46.input_layernorm.weight": "model_00048-of-00072.safetensors", "h.46.mlp.dense_4h_to_h.bias": "model_00048-of-00072.safetensors", "h.46.mlp.dense_4h_to_h.weight": "model_00048-of-00072.safetensors", "h.46.mlp.dense_h_to_4h.bias": "model_00048-of-00072.safetensors", "h.46.mlp.dense_h_to_4h.weight": "model_00048-of-00072.safetensors", "h.46.post_attention_layernorm.bias": "model_00048-of-00072.safetensors", "h.46.post_attention_layernorm.weight": "model_00048-of-00072.safetensors", "h.46.self_attention.dense.bias": "model_00048-of-00072.safetensors", "h.46.self_attention.dense.weight": "model_00048-of-00072.safetensors", "h.46.self_attention.query_key_value.bias": "model_00048-of-00072.safetensors", "h.46.self_attention.query_key_value.weight": "model_00048-of-00072.safetensors", "h.47.input_layernorm.bias": "model_00049-of-00072.safetensors", "h.47.input_layernorm.weight": "model_00049-of-00072.safetensors", "h.47.mlp.dense_4h_to_h.bias": "model_00049-of-00072.safetensors", "h.47.mlp.dense_4h_to_h.weight": "model_00049-of-00072.safetensors", "h.47.mlp.dense_h_to_4h.bias": "model_00049-of-00072.safetensors", "h.47.mlp.dense_h_to_4h.weight": "model_00049-of-00072.safetensors", "h.47.post_attention_layernorm.bias": "model_00049-of-00072.safetensors", "h.47.post_attention_layernorm.weight": "model_00049-of-00072.safetensors", "h.47.self_attention.dense.bias": "model_00049-of-00072.safetensors", "h.47.self_attention.dense.weight": "model_00049-of-00072.safetensors", "h.47.self_attention.query_key_value.bias": "model_00049-of-00072.safetensors", "h.47.self_attention.query_key_value.weight": "model_00049-of-00072.safetensors", "h.48.input_layernorm.bias": "model_00050-of-00072.safetensors", "h.48.input_layernorm.weight": "model_00050-of-00072.safetensors", "h.48.mlp.dense_4h_to_h.bias": "model_00050-of-00072.safetensors", "h.48.mlp.dense_4h_to_h.weight": "model_00050-of-00072.safetensors", "h.48.mlp.dense_h_to_4h.bias": "model_00050-of-00072.safetensors", "h.48.mlp.dense_h_to_4h.weight": "model_00050-of-00072.safetensors", "h.48.post_attention_layernorm.bias": "model_00050-of-00072.safetensors", "h.48.post_attention_layernorm.weight": "model_00050-of-00072.safetensors", "h.48.self_attention.dense.bias": "model_00050-of-00072.safetensors", "h.48.self_attention.dense.weight": "model_00050-of-00072.safetensors", "h.48.self_attention.query_key_value.bias": "model_00050-of-00072.safetensors", "h.48.self_attention.query_key_value.weight": "model_00050-of-00072.safetensors", "h.49.input_layernorm.bias": "model_00051-of-00072.safetensors", "h.49.input_layernorm.weight": "model_00051-of-00072.safetensors", "h.49.mlp.dense_4h_to_h.bias": "model_00051-of-00072.safetensors", "h.49.mlp.dense_4h_to_h.weight": "model_00051-of-00072.safetensors", "h.49.mlp.dense_h_to_4h.bias": "model_00051-of-00072.safetensors", "h.49.mlp.dense_h_to_4h.weight": "model_00051-of-00072.safetensors", "h.49.post_attention_layernorm.bias": "model_00051-of-00072.safetensors", "h.49.post_attention_layernorm.weight": "model_00051-of-00072.safetensors", "h.49.self_attention.dense.bias": "model_00051-of-00072.safetensors", "h.49.self_attention.dense.weight": "model_00051-of-00072.safetensors", "h.49.self_attention.query_key_value.bias": "model_00051-of-00072.safetensors", "h.49.self_attention.query_key_value.weight": "model_00051-of-00072.safetensors", "h.5.input_layernorm.bias": "model_00007-of-00072.safetensors", "h.5.input_layernorm.weight": "model_00007-of-00072.safetensors", "h.5.mlp.dense_4h_to_h.bias": "model_00007-of-00072.safetensors", "h.5.mlp.dense_4h_to_h.weight": "model_00007-of-00072.safetensors", "h.5.mlp.dense_h_to_4h.bias": "model_00007-of-00072.safetensors", "h.5.mlp.dense_h_to_4h.weight": "model_00007-of-00072.safetensors", "h.5.post_attention_layernorm.bias": "model_00007-of-00072.safetensors", "h.5.post_attention_layernorm.weight": "model_00007-of-00072.safetensors", "h.5.self_attention.dense.bias": "model_00007-of-00072.safetensors", "h.5.self_attention.dense.weight": "model_00007-of-00072.safetensors", "h.5.self_attention.query_key_value.bias": "model_00007-of-00072.safetensors", "h.5.self_attention.query_key_value.weight": "model_00007-of-00072.safetensors", "h.50.input_layernorm.bias": "model_00052-of-00072.safetensors", "h.50.input_layernorm.weight": "model_00052-of-00072.safetensors", "h.50.mlp.dense_4h_to_h.bias": "model_00052-of-00072.safetensors", "h.50.mlp.dense_4h_to_h.weight": "model_00052-of-00072.safetensors", "h.50.mlp.dense_h_to_4h.bias": "model_00052-of-00072.safetensors", "h.50.mlp.dense_h_to_4h.weight": "model_00052-of-00072.safetensors", "h.50.post_attention_layernorm.bias": "model_00052-of-00072.safetensors", "h.50.post_attention_layernorm.weight": "model_00052-of-00072.safetensors", "h.50.self_attention.dense.bias": "model_00052-of-00072.safetensors", "h.50.self_attention.dense.weight": "model_00052-of-00072.safetensors", "h.50.self_attention.query_key_value.bias": "model_00052-of-00072.safetensors", "h.50.self_attention.query_key_value.weight": "model_00052-of-00072.safetensors", "h.51.input_layernorm.bias": "model_00053-of-00072.safetensors", "h.51.input_layernorm.weight": "model_00053-of-00072.safetensors", "h.51.mlp.dense_4h_to_h.bias": "model_00053-of-00072.safetensors", "h.51.mlp.dense_4h_to_h.weight": "model_00053-of-00072.safetensors", "h.51.mlp.dense_h_to_4h.bias": "model_00053-of-00072.safetensors", "h.51.mlp.dense_h_to_4h.weight": "model_00053-of-00072.safetensors", "h.51.post_attention_layernorm.bias": "model_00053-of-00072.safetensors", "h.51.post_attention_layernorm.weight": "model_00053-of-00072.safetensors", "h.51.self_attention.dense.bias": "model_00053-of-00072.safetensors", "h.51.self_attention.dense.weight": "model_00053-of-00072.safetensors", "h.51.self_attention.query_key_value.bias": "model_00053-of-00072.safetensors", "h.51.self_attention.query_key_value.weight": "model_00053-of-00072.safetensors", "h.52.input_layernorm.bias": "model_00054-of-00072.safetensors", "h.52.input_layernorm.weight": "model_00054-of-00072.safetensors", "h.52.mlp.dense_4h_to_h.bias": "model_00054-of-00072.safetensors", "h.52.mlp.dense_4h_to_h.weight": "model_00054-of-00072.safetensors", "h.52.mlp.dense_h_to_4h.bias": "model_00054-of-00072.safetensors", "h.52.mlp.dense_h_to_4h.weight": "model_00054-of-00072.safetensors", "h.52.post_attention_layernorm.bias": "model_00054-of-00072.safetensors", "h.52.post_attention_layernorm.weight": "model_00054-of-00072.safetensors", "h.52.self_attention.dense.bias": "model_00054-of-00072.safetensors", "h.52.self_attention.dense.weight": "model_00054-of-00072.safetensors", "h.52.self_attention.query_key_value.bias": "model_00054-of-00072.safetensors", "h.52.self_attention.query_key_value.weight": "model_00054-of-00072.safetensors", "h.53.input_layernorm.bias": "model_00055-of-00072.safetensors", "h.53.input_layernorm.weight": "model_00055-of-00072.safetensors", "h.53.mlp.dense_4h_to_h.bias": "model_00055-of-00072.safetensors", "h.53.mlp.dense_4h_to_h.weight": "model_00055-of-00072.safetensors", "h.53.mlp.dense_h_to_4h.bias": "model_00055-of-00072.safetensors", "h.53.mlp.dense_h_to_4h.weight": "model_00055-of-00072.safetensors", "h.53.post_attention_layernorm.bias": "model_00055-of-00072.safetensors", "h.53.post_attention_layernorm.weight": "model_00055-of-00072.safetensors", "h.53.self_attention.dense.bias": "model_00055-of-00072.safetensors", "h.53.self_attention.dense.weight": "model_00055-of-00072.safetensors", "h.53.self_attention.query_key_value.bias": "model_00055-of-00072.safetensors", "h.53.self_attention.query_key_value.weight": "model_00055-of-00072.safetensors", "h.54.input_layernorm.bias": "model_00056-of-00072.safetensors", "h.54.input_layernorm.weight": "model_00056-of-00072.safetensors", "h.54.mlp.dense_4h_to_h.bias": "model_00056-of-00072.safetensors", "h.54.mlp.dense_4h_to_h.weight": "model_00056-of-00072.safetensors", "h.54.mlp.dense_h_to_4h.bias": "model_00056-of-00072.safetensors", "h.54.mlp.dense_h_to_4h.weight": "model_00056-of-00072.safetensors", "h.54.post_attention_layernorm.bias": "model_00056-of-00072.safetensors", "h.54.post_attention_layernorm.weight": "model_00056-of-00072.safetensors", "h.54.self_attention.dense.bias": "model_00056-of-00072.safetensors", "h.54.self_attention.dense.weight": "model_00056-of-00072.safetensors", "h.54.self_attention.query_key_value.bias": "model_00056-of-00072.safetensors", "h.54.self_attention.query_key_value.weight": "model_00056-of-00072.safetensors", "h.55.input_layernorm.bias": "model_00057-of-00072.safetensors", "h.55.input_layernorm.weight": "model_00057-of-00072.safetensors", "h.55.mlp.dense_4h_to_h.bias": "model_00057-of-00072.safetensors", "h.55.mlp.dense_4h_to_h.weight": "model_00057-of-00072.safetensors", "h.55.mlp.dense_h_to_4h.bias": "model_00057-of-00072.safetensors", "h.55.mlp.dense_h_to_4h.weight": "model_00057-of-00072.safetensors", "h.55.post_attention_layernorm.bias": "model_00057-of-00072.safetensors", "h.55.post_attention_layernorm.weight": "model_00057-of-00072.safetensors", "h.55.self_attention.dense.bias": "model_00057-of-00072.safetensors", "h.55.self_attention.dense.weight": "model_00057-of-00072.safetensors", "h.55.self_attention.query_key_value.bias": "model_00057-of-00072.safetensors", "h.55.self_attention.query_key_value.weight": "model_00057-of-00072.safetensors", "h.56.input_layernorm.bias": "model_00058-of-00072.safetensors", "h.56.input_layernorm.weight": "model_00058-of-00072.safetensors", "h.56.mlp.dense_4h_to_h.bias": "model_00058-of-00072.safetensors", "h.56.mlp.dense_4h_to_h.weight": "model_00058-of-00072.safetensors", "h.56.mlp.dense_h_to_4h.bias": "model_00058-of-00072.safetensors", "h.56.mlp.dense_h_to_4h.weight": "model_00058-of-00072.safetensors", "h.56.post_attention_layernorm.bias": "model_00058-of-00072.safetensors", "h.56.post_attention_layernorm.weight": "model_00058-of-00072.safetensors", "h.56.self_attention.dense.bias": "model_00058-of-00072.safetensors", "h.56.self_attention.dense.weight": "model_00058-of-00072.safetensors", "h.56.self_attention.query_key_value.bias": "model_00058-of-00072.safetensors", "h.56.self_attention.query_key_value.weight": "model_00058-of-00072.safetensors", "h.57.input_layernorm.bias": "model_00059-of-00072.safetensors", "h.57.input_layernorm.weight": "model_00059-of-00072.safetensors", "h.57.mlp.dense_4h_to_h.bias": "model_00059-of-00072.safetensors", "h.57.mlp.dense_4h_to_h.weight": "model_00059-of-00072.safetensors", "h.57.mlp.dense_h_to_4h.bias": "model_00059-of-00072.safetensors", "h.57.mlp.dense_h_to_4h.weight": "model_00059-of-00072.safetensors", "h.57.post_attention_layernorm.bias": "model_00059-of-00072.safetensors", "h.57.post_attention_layernorm.weight": "model_00059-of-00072.safetensors", "h.57.self_attention.dense.bias": "model_00059-of-00072.safetensors", "h.57.self_attention.dense.weight": "model_00059-of-00072.safetensors", "h.57.self_attention.query_key_value.bias": "model_00059-of-00072.safetensors", "h.57.self_attention.query_key_value.weight": "model_00059-of-00072.safetensors", "h.58.input_layernorm.bias": "model_00060-of-00072.safetensors", "h.58.input_layernorm.weight": "model_00060-of-00072.safetensors", "h.58.mlp.dense_4h_to_h.bias": "model_00060-of-00072.safetensors", "h.58.mlp.dense_4h_to_h.weight": "model_00060-of-00072.safetensors", "h.58.mlp.dense_h_to_4h.bias": "model_00060-of-00072.safetensors", "h.58.mlp.dense_h_to_4h.weight": "model_00060-of-00072.safetensors", "h.58.post_attention_layernorm.bias": "model_00060-of-00072.safetensors", "h.58.post_attention_layernorm.weight": "model_00060-of-00072.safetensors", "h.58.self_attention.dense.bias": "model_00060-of-00072.safetensors", "h.58.self_attention.dense.weight": "model_00060-of-00072.safetensors", "h.58.self_attention.query_key_value.bias": "model_00060-of-00072.safetensors", "h.58.self_attention.query_key_value.weight": "model_00060-of-00072.safetensors", "h.59.input_layernorm.bias": "model_00061-of-00072.safetensors", "h.59.input_layernorm.weight": "model_00061-of-00072.safetensors", "h.59.mlp.dense_4h_to_h.bias": "model_00061-of-00072.safetensors", "h.59.mlp.dense_4h_to_h.weight": "model_00061-of-00072.safetensors", "h.59.mlp.dense_h_to_4h.bias": "model_00061-of-00072.safetensors", "h.59.mlp.dense_h_to_4h.weight": "model_00061-of-00072.safetensors", "h.59.post_attention_layernorm.bias": "model_00061-of-00072.safetensors", "h.59.post_attention_layernorm.weight": "model_00061-of-00072.safetensors", "h.59.self_attention.dense.bias": "model_00061-of-00072.safetensors", "h.59.self_attention.dense.weight": "model_00061-of-00072.safetensors", "h.59.self_attention.query_key_value.bias": "model_00061-of-00072.safetensors", "h.59.self_attention.query_key_value.weight": "model_00061-of-00072.safetensors", "h.6.input_layernorm.bias": "model_00008-of-00072.safetensors", "h.6.input_layernorm.weight": "model_00008-of-00072.safetensors", "h.6.mlp.dense_4h_to_h.bias": "model_00008-of-00072.safetensors", "h.6.mlp.dense_4h_to_h.weight": "model_00008-of-00072.safetensors", "h.6.mlp.dense_h_to_4h.bias": "model_00008-of-00072.safetensors", "h.6.mlp.dense_h_to_4h.weight": "model_00008-of-00072.safetensors", "h.6.post_attention_layernorm.bias": "model_00008-of-00072.safetensors", "h.6.post_attention_layernorm.weight": "model_00008-of-00072.safetensors", "h.6.self_attention.dense.bias": "model_00008-of-00072.safetensors", "h.6.self_attention.dense.weight": "model_00008-of-00072.safetensors", "h.6.self_attention.query_key_value.bias": "model_00008-of-00072.safetensors", "h.6.self_attention.query_key_value.weight": "model_00008-of-00072.safetensors", "h.60.input_layernorm.bias": "model_00062-of-00072.safetensors", "h.60.input_layernorm.weight": "model_00062-of-00072.safetensors", "h.60.mlp.dense_4h_to_h.bias": "model_00062-of-00072.safetensors", "h.60.mlp.dense_4h_to_h.weight": "model_00062-of-00072.safetensors", "h.60.mlp.dense_h_to_4h.bias": "model_00062-of-00072.safetensors", "h.60.mlp.dense_h_to_4h.weight": "model_00062-of-00072.safetensors", "h.60.post_attention_layernorm.bias": "model_00062-of-00072.safetensors", "h.60.post_attention_layernorm.weight": "model_00062-of-00072.safetensors", "h.60.self_attention.dense.bias": "model_00062-of-00072.safetensors", "h.60.self_attention.dense.weight": "model_00062-of-00072.safetensors", "h.60.self_attention.query_key_value.bias": "model_00062-of-00072.safetensors", "h.60.self_attention.query_key_value.weight": "model_00062-of-00072.safetensors", "h.61.input_layernorm.bias": "model_00063-of-00072.safetensors", "h.61.input_layernorm.weight": "model_00063-of-00072.safetensors", "h.61.mlp.dense_4h_to_h.bias": "model_00063-of-00072.safetensors", "h.61.mlp.dense_4h_to_h.weight": "model_00063-of-00072.safetensors", "h.61.mlp.dense_h_to_4h.bias": "model_00063-of-00072.safetensors", "h.61.mlp.dense_h_to_4h.weight": "model_00063-of-00072.safetensors", "h.61.post_attention_layernorm.bias": "model_00063-of-00072.safetensors", "h.61.post_attention_layernorm.weight": "model_00063-of-00072.safetensors", "h.61.self_attention.dense.bias": "model_00063-of-00072.safetensors", "h.61.self_attention.dense.weight": "model_00063-of-00072.safetensors", "h.61.self_attention.query_key_value.bias": "model_00063-of-00072.safetensors", "h.61.self_attention.query_key_value.weight": "model_00063-of-00072.safetensors", "h.62.input_layernorm.bias": "model_00064-of-00072.safetensors", "h.62.input_layernorm.weight": "model_00064-of-00072.safetensors", "h.62.mlp.dense_4h_to_h.bias": "model_00064-of-00072.safetensors", "h.62.mlp.dense_4h_to_h.weight": "model_00064-of-00072.safetensors", "h.62.mlp.dense_h_to_4h.bias": "model_00064-of-00072.safetensors", "h.62.mlp.dense_h_to_4h.weight": "model_00064-of-00072.safetensors", "h.62.post_attention_layernorm.bias": "model_00064-of-00072.safetensors", "h.62.post_attention_layernorm.weight": "model_00064-of-00072.safetensors", "h.62.self_attention.dense.bias": "model_00064-of-00072.safetensors", "h.62.self_attention.dense.weight": "model_00064-of-00072.safetensors", "h.62.self_attention.query_key_value.bias": "model_00064-of-00072.safetensors", "h.62.self_attention.query_key_value.weight": "model_00064-of-00072.safetensors", "h.63.input_layernorm.bias": "model_00065-of-00072.safetensors", "h.63.input_layernorm.weight": "model_00065-of-00072.safetensors", "h.63.mlp.dense_4h_to_h.bias": "model_00065-of-00072.safetensors", "h.63.mlp.dense_4h_to_h.weight": "model_00065-of-00072.safetensors", "h.63.mlp.dense_h_to_4h.bias": "model_00065-of-00072.safetensors", "h.63.mlp.dense_h_to_4h.weight": "model_00065-of-00072.safetensors", "h.63.post_attention_layernorm.bias": "model_00065-of-00072.safetensors", "h.63.post_attention_layernorm.weight": "model_00065-of-00072.safetensors", "h.63.self_attention.dense.bias": "model_00065-of-00072.safetensors", "h.63.self_attention.dense.weight": "model_00065-of-00072.safetensors", "h.63.self_attention.query_key_value.bias": "model_00065-of-00072.safetensors", "h.63.self_attention.query_key_value.weight": "model_00065-of-00072.safetensors", "h.64.input_layernorm.bias": "model_00066-of-00072.safetensors", "h.64.input_layernorm.weight": "model_00066-of-00072.safetensors", "h.64.mlp.dense_4h_to_h.bias": "model_00066-of-00072.safetensors", "h.64.mlp.dense_4h_to_h.weight": "model_00066-of-00072.safetensors", "h.64.mlp.dense_h_to_4h.bias": "model_00066-of-00072.safetensors", "h.64.mlp.dense_h_to_4h.weight": "model_00066-of-00072.safetensors", "h.64.post_attention_layernorm.bias": "model_00066-of-00072.safetensors", "h.64.post_attention_layernorm.weight": "model_00066-of-00072.safetensors", "h.64.self_attention.dense.bias": "model_00066-of-00072.safetensors", "h.64.self_attention.dense.weight": "model_00066-of-00072.safetensors", "h.64.self_attention.query_key_value.bias": "model_00066-of-00072.safetensors", "h.64.self_attention.query_key_value.weight": "model_00066-of-00072.safetensors", "h.65.input_layernorm.bias": "model_00067-of-00072.safetensors", "h.65.input_layernorm.weight": "model_00067-of-00072.safetensors", "h.65.mlp.dense_4h_to_h.bias": "model_00067-of-00072.safetensors", "h.65.mlp.dense_4h_to_h.weight": "model_00067-of-00072.safetensors", "h.65.mlp.dense_h_to_4h.bias": "model_00067-of-00072.safetensors", "h.65.mlp.dense_h_to_4h.weight": "model_00067-of-00072.safetensors", "h.65.post_attention_layernorm.bias": "model_00067-of-00072.safetensors", "h.65.post_attention_layernorm.weight": "model_00067-of-00072.safetensors", "h.65.self_attention.dense.bias": "model_00067-of-00072.safetensors", "h.65.self_attention.dense.weight": "model_00067-of-00072.safetensors", "h.65.self_attention.query_key_value.bias": "model_00067-of-00072.safetensors", "h.65.self_attention.query_key_value.weight": "model_00067-of-00072.safetensors", "h.66.input_layernorm.bias": "model_00068-of-00072.safetensors", "h.66.input_layernorm.weight": "model_00068-of-00072.safetensors", "h.66.mlp.dense_4h_to_h.bias": "model_00068-of-00072.safetensors", "h.66.mlp.dense_4h_to_h.weight": "model_00068-of-00072.safetensors", "h.66.mlp.dense_h_to_4h.bias": "model_00068-of-00072.safetensors", "h.66.mlp.dense_h_to_4h.weight": "model_00068-of-00072.safetensors", "h.66.post_attention_layernorm.bias": "model_00068-of-00072.safetensors", "h.66.post_attention_layernorm.weight": "model_00068-of-00072.safetensors", "h.66.self_attention.dense.bias": "model_00068-of-00072.safetensors", "h.66.self_attention.dense.weight": "model_00068-of-00072.safetensors", "h.66.self_attention.query_key_value.bias": "model_00068-of-00072.safetensors", "h.66.self_attention.query_key_value.weight": "model_00068-of-00072.safetensors", "h.67.input_layernorm.bias": "model_00069-of-00072.safetensors", "h.67.input_layernorm.weight": "model_00069-of-00072.safetensors", "h.67.mlp.dense_4h_to_h.bias": "model_00069-of-00072.safetensors", "h.67.mlp.dense_4h_to_h.weight": "model_00069-of-00072.safetensors", "h.67.mlp.dense_h_to_4h.bias": "model_00069-of-00072.safetensors", "h.67.mlp.dense_h_to_4h.weight": "model_00069-of-00072.safetensors", "h.67.post_attention_layernorm.bias": "model_00069-of-00072.safetensors", "h.67.post_attention_layernorm.weight": "model_00069-of-00072.safetensors", "h.67.self_attention.dense.bias": "model_00069-of-00072.safetensors", "h.67.self_attention.dense.weight": "model_00069-of-00072.safetensors", "h.67.self_attention.query_key_value.bias": "model_00069-of-00072.safetensors", "h.67.self_attention.query_key_value.weight": "model_00069-of-00072.safetensors", "h.68.input_layernorm.bias": "model_00070-of-00072.safetensors", "h.68.input_layernorm.weight": "model_00070-of-00072.safetensors", "h.68.mlp.dense_4h_to_h.bias": "model_00070-of-00072.safetensors", "h.68.mlp.dense_4h_to_h.weight": "model_00070-of-00072.safetensors", "h.68.mlp.dense_h_to_4h.bias": "model_00070-of-00072.safetensors", "h.68.mlp.dense_h_to_4h.weight": "model_00070-of-00072.safetensors", "h.68.post_attention_layernorm.bias": "model_00070-of-00072.safetensors", "h.68.post_attention_layernorm.weight": "model_00070-of-00072.safetensors", "h.68.self_attention.dense.bias": "model_00070-of-00072.safetensors", "h.68.self_attention.dense.weight": "model_00070-of-00072.safetensors", "h.68.self_attention.query_key_value.bias": "model_00070-of-00072.safetensors", "h.68.self_attention.query_key_value.weight": "model_00070-of-00072.safetensors", "h.69.input_layernorm.bias": "model_00071-of-00072.safetensors", "h.69.input_layernorm.weight": "model_00071-of-00072.safetensors", "h.69.mlp.dense_4h_to_h.bias": "model_00071-of-00072.safetensors", "h.69.mlp.dense_4h_to_h.weight": "model_00071-of-00072.safetensors", "h.69.mlp.dense_h_to_4h.bias": "model_00071-of-00072.safetensors", "h.69.mlp.dense_h_to_4h.weight": "model_00071-of-00072.safetensors", "h.69.post_attention_layernorm.bias": "model_00071-of-00072.safetensors", "h.69.post_attention_layernorm.weight": "model_00071-of-00072.safetensors", "h.69.self_attention.dense.bias": "model_00071-of-00072.safetensors", "h.69.self_attention.dense.weight": "model_00071-of-00072.safetensors", "h.69.self_attention.query_key_value.bias": "model_00071-of-00072.safetensors", "h.69.self_attention.query_key_value.weight": "model_00071-of-00072.safetensors", "h.7.input_layernorm.bias": "model_00009-of-00072.safetensors", "h.7.input_layernorm.weight": "model_00009-of-00072.safetensors", "h.7.mlp.dense_4h_to_h.bias": "model_00009-of-00072.safetensors", "h.7.mlp.dense_4h_to_h.weight": "model_00009-of-00072.safetensors", "h.7.mlp.dense_h_to_4h.bias": "model_00009-of-00072.safetensors", "h.7.mlp.dense_h_to_4h.weight": "model_00009-of-00072.safetensors", "h.7.post_attention_layernorm.bias": "model_00009-of-00072.safetensors", "h.7.post_attention_layernorm.weight": "model_00009-of-00072.safetensors", "h.7.self_attention.dense.bias": "model_00009-of-00072.safetensors", "h.7.self_attention.dense.weight": "model_00009-of-00072.safetensors", "h.7.self_attention.query_key_value.bias": "model_00009-of-00072.safetensors", "h.7.self_attention.query_key_value.weight": "model_00009-of-00072.safetensors", "h.8.input_layernorm.bias": "model_00010-of-00072.safetensors", "h.8.input_layernorm.weight": "model_00010-of-00072.safetensors", "h.8.mlp.dense_4h_to_h.bias": "model_00010-of-00072.safetensors", "h.8.mlp.dense_4h_to_h.weight": "model_00010-of-00072.safetensors", "h.8.mlp.dense_h_to_4h.bias": "model_00010-of-00072.safetensors", "h.8.mlp.dense_h_to_4h.weight": "model_00010-of-00072.safetensors", "h.8.post_attention_layernorm.bias": "model_00010-of-00072.safetensors", "h.8.post_attention_layernorm.weight": "model_00010-of-00072.safetensors", "h.8.self_attention.dense.bias": "model_00010-of-00072.safetensors", "h.8.self_attention.dense.weight": "model_00010-of-00072.safetensors", "h.8.self_attention.query_key_value.bias": "model_00010-of-00072.safetensors", "h.8.self_attention.query_key_value.weight": "model_00010-of-00072.safetensors", "h.9.input_layernorm.bias": "model_00011-of-00072.safetensors", "h.9.input_layernorm.weight": "model_00011-of-00072.safetensors", "h.9.mlp.dense_4h_to_h.bias": "model_00011-of-00072.safetensors", "h.9.mlp.dense_4h_to_h.weight": "model_00011-of-00072.safetensors", "h.9.mlp.dense_h_to_4h.bias": "model_00011-of-00072.safetensors", "h.9.mlp.dense_h_to_4h.weight": "model_00011-of-00072.safetensors", "h.9.post_attention_layernorm.bias": "model_00011-of-00072.safetensors", "h.9.post_attention_layernorm.weight": "model_00011-of-00072.safetensors", "h.9.self_attention.dense.bias": "model_00011-of-00072.safetensors", "h.9.self_attention.dense.weight": "model_00011-of-00072.safetensors", "h.9.self_attention.query_key_value.bias": "model_00011-of-00072.safetensors", "h.9.self_attention.query_key_value.weight": "model_00011-of-00072.safetensors", "ln_f.bias": "model_00072-of-00072.safetensors", "ln_f.weight": "model_00072-of-00072.safetensors", "word_embeddings.weight": "model_00001-of-00072.safetensors", "word_embeddings_layernorm.bias": "model_00001-of-00072.safetensors", "word_embeddings_layernorm.weight": "model_00001-of-00072.safetensors"}}
\ No newline at end of file
diff --git a/model_00001-of-00072.safetensors b/model_00001-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..30260d66051b57fb8fdbbb2c60f7ebe339607f9b
--- /dev/null
+++ b/model_00001-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:994b72408da2fd0cd99854528e5db5323fa7f98998e928478b7b9b2961fa7c19
+size 7193289051
diff --git a/model_00002-of-00072.safetensors b/model_00002-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..16910045a373267445051816e83d62cab2e35178
--- /dev/null
+++ b/model_00002-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e2b0689f9a6c1137f5ce2ddd6a7d3d2708e86334174175443265a288b5c42f9b
+size 4932875531
diff --git a/model_00003-of-00072.safetensors b/model_00003-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..898eec6e4e07c6dc4d16773a4a4afa6b12ca3e14
--- /dev/null
+++ b/model_00003-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b44a492e74c13fa0e7a5a64c288ed341824ec100a36a72401561442d6bcc6841
+size 4932875531
diff --git a/model_00004-of-00072.safetensors b/model_00004-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d0ba5fc5405621441bcafaf8952c68792a372cc7
--- /dev/null
+++ b/model_00004-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b30c540c26f99c3c5d7e4ad02a58a422031534a00196f990b9ad24af79b7904
+size 4932875531
diff --git a/model_00005-of-00072.safetensors b/model_00005-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e757db00edfbe0dbc1ffc561e9564686ea4c717c
--- /dev/null
+++ b/model_00005-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98a117f92df94f4ee63f823ab0890b3cf31c9186625b368f267b65da5cfed559
+size 4932875531
diff --git a/model_00006-of-00072.safetensors b/model_00006-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f0d6177e2e68211d9eb40971e5ac97ec224905d1
--- /dev/null
+++ b/model_00006-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dca2e322c85eaf4afc067b1afa5c172f81ddcafc20d13adc9fc806846e62cca5
+size 4932875531
diff --git a/model_00007-of-00072.safetensors b/model_00007-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1f4f63e64e615ba9a40e3b3d179f1672d4e87112
--- /dev/null
+++ b/model_00007-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a6f6504ff6354a2dbf3110a6a50daf24e7d9b7a29bb5891572559ce78b71780
+size 4932875531
diff --git a/model_00008-of-00072.safetensors b/model_00008-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c4b68e57c3c8eb8dc801205684a2be7767c29621
--- /dev/null
+++ b/model_00008-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c62f5a9b1cfdb6e14a678caa704186a4000cedeb6a047a434ddcffc323229806
+size 4932875531
diff --git a/model_00009-of-00072.safetensors b/model_00009-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..56014626d2aa0a6df827ad424a9bf3591c45bdf1
--- /dev/null
+++ b/model_00009-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45d609a80c4162319f7652ea44f168221f82759c3a320cfac3660bf818f708c3
+size 4932875531
diff --git a/model_00010-of-00072.safetensors b/model_00010-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bce7da7b7609c175a30b4139086365b683dacced
--- /dev/null
+++ b/model_00010-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3cc4965d0bbde6392185bc8ba792a5b599b6ea39726b57d6e8e752542f938a49
+size 4932875531
diff --git a/model_00011-of-00072.safetensors b/model_00011-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cb44bf310039869503f0d91bf86a07bc5937491c
--- /dev/null
+++ b/model_00011-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb964b7ac826ec9fddc2eb61d5fdd32653bc855a14c16f4bbe56924385e117ef
+size 4932875531
diff --git a/model_00012-of-00072.safetensors b/model_00012-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..75d8deea9dc16fd835d9eafe234b52377066a290
--- /dev/null
+++ b/model_00012-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7b535b3ec8c447c220aa612c0f8a8ca17928427e9fdd13915a853e98a54de633
+size 4932875543
diff --git a/model_00013-of-00072.safetensors b/model_00013-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bb7f0a3cb224f2faddb5755a5592e18af75e7eda
--- /dev/null
+++ b/model_00013-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6498da058b0a9f36b12a13684047517f0fc863980847c0d3df8e3085df4f723e
+size 4932875543
diff --git a/model_00014-of-00072.safetensors b/model_00014-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..105e4696c6936c93b4b03d6535db9c0055b54292
--- /dev/null
+++ b/model_00014-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5de752a5c66543d8adb7548f2cb6121cefb0edcfbcdcff61cdc39aa5c0a31ad6
+size 4932875543
diff --git a/model_00015-of-00072.safetensors b/model_00015-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..aa88e24243ce7bbc25c4fab228df45dd73be3392
--- /dev/null
+++ b/model_00015-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:423abb3cb74c83c1d9e6887b18adfa8d4349c7c62b8494addabc4bcd5eddbd23
+size 4932875543
diff --git a/model_00016-of-00072.safetensors b/model_00016-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9925d00b39836fa045f7cc8481787d70f40cbc69
--- /dev/null
+++ b/model_00016-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5eeaf9ecd49277fb9551eea8dee683e278cfc8f18a497692199bb26e334f6eac
+size 4932875543
diff --git a/model_00017-of-00072.safetensors b/model_00017-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b3cff9996ad7b3b50bfc2c838c03567e14ee7acc
--- /dev/null
+++ b/model_00017-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49050db778b4fe213963108dc8d76b8718b35889a8a9f12fb01f6880c5def9c0
+size 4932875543
diff --git a/model_00018-of-00072.safetensors b/model_00018-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..eca59991e53aee8414d916d494f00710e364f405
--- /dev/null
+++ b/model_00018-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:456d316970ba92785b6f52f5ff998ceaad96cb9464633823fa8dca29aaa6ad09
+size 4932875543
diff --git a/model_00019-of-00072.safetensors b/model_00019-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..65c1638dfd10f19ac287f18145c7254d87323a46
--- /dev/null
+++ b/model_00019-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b21e46c69790640a99841d7b23d640275946b7c99a6f2b7985c7c816584a407
+size 4932875543
diff --git a/model_00020-of-00072.safetensors b/model_00020-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ce8868dad79a2901cb0c98c13c1f275282256594
--- /dev/null
+++ b/model_00020-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8acd344ce56493e4901d406027bf9f88385d4c68594d48214af59cf78534a94
+size 4932875543
diff --git a/model_00021-of-00072.safetensors b/model_00021-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c899195a5caf37548e70a57290566cc44f3384e4
--- /dev/null
+++ b/model_00021-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2b48bdd0b8a01e599a6e4e607692ddc0505818735ca4ab4b2371da733a9b35e1
+size 4932875543
diff --git a/model_00022-of-00072.safetensors b/model_00022-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..07cb2d1db4f0d43e662b08ab86d551e883361ec5
--- /dev/null
+++ b/model_00022-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5897e2f0a9683b9d49811fe30deb461e4d30c5c37034953fe31c9515befd34a1
+size 4932875543
diff --git a/model_00023-of-00072.safetensors b/model_00023-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1231220127541975d881968503ceb89ab2e2c91a
--- /dev/null
+++ b/model_00023-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0740d2798a12687cd10985a7ffa88d22111168ba59866aa53799b8a8e1c5fda1
+size 4932875543
diff --git a/model_00024-of-00072.safetensors b/model_00024-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..93888ffe95e1427ad619c8b76a487a12442aaf56
--- /dev/null
+++ b/model_00024-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:697d91fb41a3015613a1b2bae5fc3224af7c81dcfa43796af5e1dc1cb9d872ad
+size 4932875543
diff --git a/model_00025-of-00072.safetensors b/model_00025-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b47e8efd2b8481025c9e3bb897aa754e7fd2ecce
--- /dev/null
+++ b/model_00025-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2146ea66a8d6d7fa762b9b8084f9f1b29a445e8b0bef46694af44e9894a04ecf
+size 4932875543
diff --git a/model_00026-of-00072.safetensors b/model_00026-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8552264e0fabc568b7978d5689fd732a32421dc4
--- /dev/null
+++ b/model_00026-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:95e0948f76650b956f6976aa0eabd8194e3b80430e171df3d14eeecb2c5c4a70
+size 4932875543
diff --git a/model_00027-of-00072.safetensors b/model_00027-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..13e56418f21bf2f1aef49565af3fe645f335a185
--- /dev/null
+++ b/model_00027-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f66ce06a60cd3b3b085dbebeff833cd5510047c299e98dc87b936ab2d5c9bc52
+size 4932875543
diff --git a/model_00028-of-00072.safetensors b/model_00028-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a66bf89ad5c9d9c713c23f24a49798899fa60bea
--- /dev/null
+++ b/model_00028-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3e12fdebc4f3cb0e92754ed1b379f4edb1422632e031d7804f08f436d84e036
+size 4932875543
diff --git a/model_00029-of-00072.safetensors b/model_00029-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2311d77a4b9de24a95dd491e0415be4bae62e142
--- /dev/null
+++ b/model_00029-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68ed59dc66836d6034ed5da884d1812a760966416e7294c987e9ffb2ce240c24
+size 4932875543
diff --git a/model_00030-of-00072.safetensors b/model_00030-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bb3f010dc6aa9f6e036ad4265094c56a32cc7df0
--- /dev/null
+++ b/model_00030-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec26a9dd14d23fedbb82edfe0879d5f1503e5a051eb308c831a11238fb4294fa
+size 4932875543
diff --git a/model_00031-of-00072.safetensors b/model_00031-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..67900c9a64eeedda1192255d6fefc1e6947ece53
--- /dev/null
+++ b/model_00031-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a2e0c3318aabb013d4a48ff871c4550d718c2f68b7088051637303425e033f45
+size 4932875543
diff --git a/model_00032-of-00072.safetensors b/model_00032-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..602ec416f6f2a130e38752c30fa4adcaf9c7cf2c
--- /dev/null
+++ b/model_00032-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0776f0a61f6df60732edefe23d6990c22eba306693857df077c083c234e79235
+size 4932875543
diff --git a/model_00033-of-00072.safetensors b/model_00033-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d84a6de3c3370f8c333ba073f855888caa06cfae
--- /dev/null
+++ b/model_00033-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:22ee6e7be1a916a67e6b3c707411ca9f2460b3c290fe9a59cab948e3ea1d78d6
+size 4932875543
diff --git a/model_00034-of-00072.safetensors b/model_00034-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..681109c6abaa6755c5ec47230f7f3bb92fe80cd6
--- /dev/null
+++ b/model_00034-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b5b413253cf5a9afc8c6e30962bad03ebddeb8e05ff79a38be11045d680ff09
+size 4932875543
diff --git a/model_00035-of-00072.safetensors b/model_00035-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..94c3e5aaf7a1c62b1aa5d18ccbc27e20eeddd54e
--- /dev/null
+++ b/model_00035-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:97faa992fbfcc4f8d3ad4ac8bbc274c8a19d969a4693d37a5705d087d02dcc97
+size 4932875543
diff --git a/model_00036-of-00072.safetensors b/model_00036-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..46fda16e47018ac58c7dbe7c0d5dd05f44c5b8da
--- /dev/null
+++ b/model_00036-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df3fd31785ac9071d7373ea080bc0add35cb5e9da80b6032acf5b7a3da6740a7
+size 4932875543
diff --git a/model_00037-of-00072.safetensors b/model_00037-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7f8522f68d5f0073e30d09c2646a8c11dea98115
--- /dev/null
+++ b/model_00037-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5204f0a325dd6957ac7fb50721ea673bc3aec77f0c0b321d296523c512ed9c38
+size 4932875543
diff --git a/model_00038-of-00072.safetensors b/model_00038-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7e4fe642ed8d165cc30418665ac03e820cc6fb44
--- /dev/null
+++ b/model_00038-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b00cf8536d13000c50a74d2051ad99405e30cd4ca9f12105d8969e48bc29bd51
+size 4932875543
diff --git a/model_00039-of-00072.safetensors b/model_00039-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..928ccb9a000c55e9ff6a4933f9a8c9c928e1e6c1
--- /dev/null
+++ b/model_00039-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69f087d035224b20881afe98e5db0a68b438a891b4d53bf4b598c853aecf25bf
+size 4932875543
diff --git a/model_00040-of-00072.safetensors b/model_00040-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..375d41e8148cde63ba89548c5115d3015957bb26
--- /dev/null
+++ b/model_00040-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b3dc468943c23e4552400e1ef1d703c5a48f56ed9b50180278f4af8b0169844f
+size 4932875543
diff --git a/model_00041-of-00072.safetensors b/model_00041-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7a557e6ad541df61f04edb89a2c4bd5104d8d6fe
--- /dev/null
+++ b/model_00041-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:081720fa9373987be0555ab87aeeb0152c55154d520f5b2194fd61bcd424f5ea
+size 4932875543
diff --git a/model_00042-of-00072.safetensors b/model_00042-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f6dc6153bc2a591fa0c49b6f1089232073e7bd50
--- /dev/null
+++ b/model_00042-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83778fe861ea1d3899fb16cb8b415cc7cef46834156b62930bcf6355554dc6d0
+size 4932875543
diff --git a/model_00043-of-00072.safetensors b/model_00043-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b01b246c3bf4fab2fb6f2868f60d411f8e89c1d2
--- /dev/null
+++ b/model_00043-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b595b6aa4ea1650719dbd86c4c5691356bf23d5b74ee6a61898b3ea31b0fc6f
+size 4932875543
diff --git a/model_00044-of-00072.safetensors b/model_00044-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f2daec58f722faa40e900c0dcec4ae615e17f763
--- /dev/null
+++ b/model_00044-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c89aabdea4b993eb0f7f996005559bb3f52cf1997f4ded797aba36765c73aad
+size 4932875543
diff --git a/model_00045-of-00072.safetensors b/model_00045-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..560715c6ed6717277991a419a64a6e978bc199c6
--- /dev/null
+++ b/model_00045-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54e034d46c4db8c91188860c40b64bf5c00e3b5064dc46a9152acabf8ac14ef9
+size 4932875543
diff --git a/model_00046-of-00072.safetensors b/model_00046-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..89078124d6b0ab83667a425e09e1b56f17a77df1
--- /dev/null
+++ b/model_00046-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61559dec39143c7a1197c82612bf17a78c438e51dc821ddf6e49cbdd1e877f1a
+size 4932875543
diff --git a/model_00047-of-00072.safetensors b/model_00047-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c1354e5aacd329c783b7bb27d8dab24e9a1f4bfc
--- /dev/null
+++ b/model_00047-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c97f83d253b9afa0b2fbfcbca421d02c3ee3f51efebc1cd9d85d7b3d230b1ead
+size 4932875543
diff --git a/model_00048-of-00072.safetensors b/model_00048-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8fc59b73db5da20d856729df192453d90e3595b3
--- /dev/null
+++ b/model_00048-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:513e2a76f92420713f3adcf1264ccdf9b9c26ba632222d5a8483372fc4516f74
+size 4932875543
diff --git a/model_00049-of-00072.safetensors b/model_00049-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..65d4b01dd14fc66e34a10ced550ccd0d2f48420a
--- /dev/null
+++ b/model_00049-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1bf07b579cc0e5ebcf762339e2924315c8297332a81219da8e8fd5cfa8e1872
+size 4932875543
diff --git a/model_00050-of-00072.safetensors b/model_00050-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0297b62124ed49f2c0c1752b184c7f2214a310f9
--- /dev/null
+++ b/model_00050-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50d02230047ca9839a4cb15ee4ff794edd97342df9faa08bf8a4876ec5904753
+size 4932875543
diff --git a/model_00051-of-00072.safetensors b/model_00051-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5246577ea42bd2cd70e4cb3979e7ec9bb1ef95a7
--- /dev/null
+++ b/model_00051-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7b6245728fae397b0fc0104c52c978663556c2a96959f07b594dbc1115ed996
+size 4932875543
diff --git a/model_00052-of-00072.safetensors b/model_00052-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1f164d5934b3c0780eff6c9628ff2a3dede61e54
--- /dev/null
+++ b/model_00052-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b5eccaeb58cc34ba590084e6dad261d56770b3cfa63cda813b3377888241f800
+size 4932875543
diff --git a/model_00053-of-00072.safetensors b/model_00053-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a201213fa3bc03dfb496d4466f3f24527a24b1b5
--- /dev/null
+++ b/model_00053-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48821213ce3118097146b4556a77b6ce76b825c21a6653cabddb08f931ca6b98
+size 4932875543
diff --git a/model_00054-of-00072.safetensors b/model_00054-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a32bec456feea3e846405037544087d5f1ae9609
--- /dev/null
+++ b/model_00054-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:293a797ad623652d18f4b4c2a8fc37cda8e7bcb5f557bdee2cadeede92b362d9
+size 4932875543
diff --git a/model_00055-of-00072.safetensors b/model_00055-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a4521d7a52ab056eda1161c9d38ccc10b6cd5e2c
--- /dev/null
+++ b/model_00055-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ba61f2b542cbe8ba87a8cb262581fdaa61dfb831e7f40966a16167e051be4c5b
+size 4932875543
diff --git a/model_00056-of-00072.safetensors b/model_00056-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b404e004f97c94f9d52d952a26e47e42f6db67fc
--- /dev/null
+++ b/model_00056-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2eb8d3575c2304a3e7d29156f08182c45b80ea33be8cfbc01aef878c1972ea9
+size 4932875543
diff --git a/model_00057-of-00072.safetensors b/model_00057-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5f1396e0f655298c7cedf6c918ac0fad77f5293f
--- /dev/null
+++ b/model_00057-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dba03ba7f74433d52937ca0314ba408736d440615bd470f78565e48bd6b22761
+size 4932875543
diff --git a/model_00058-of-00072.safetensors b/model_00058-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9e19b76313e7e2da82e268598b5060fa4014b74b
--- /dev/null
+++ b/model_00058-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:99bf90726291ca8be1d822c1f83edebc0b2d28c1af7d1f3434431a574505137f
+size 4932875543
diff --git a/model_00059-of-00072.safetensors b/model_00059-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..55e52ffa7ecfc92ba293176dcdabe03a77e9219f
--- /dev/null
+++ b/model_00059-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:435e8b6b876d6848a5be4a94666186fab8d744797c542d508d79f616cbd828eb
+size 4932875543
diff --git a/model_00060-of-00072.safetensors b/model_00060-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c80ea2e1063f18c6b38bf29391234bf422e1e20c
--- /dev/null
+++ b/model_00060-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec52f43d3b7c47a047e343bec140a1ec722dcdc4e2428ec51949de8a9f9be048
+size 4932875543
diff --git a/model_00061-of-00072.safetensors b/model_00061-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6acf035234524c5e00bf07bf37e1cb081313f2ab
--- /dev/null
+++ b/model_00061-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cc2936f6d312083fb1330a382957230e7fcac20de6a033e17eef65656faf0f70
+size 4932875543
diff --git a/model_00062-of-00072.safetensors b/model_00062-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2738dc6ad35b430ddbadc0c25138f59b21a6ff53
--- /dev/null
+++ b/model_00062-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:277fb5c564cff321888294f76af04cda7bb6a6140db377e85e85b92d378ed682
+size 4932875543
diff --git a/model_00063-of-00072.safetensors b/model_00063-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b6cb595b340c754e7d710e9a2df7e729a7472c8b
--- /dev/null
+++ b/model_00063-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9005b11cc55a23a8b233d48c6b09e2e76777e055fdfc6f3576c96c761ebb6cb6
+size 4932875543
diff --git a/model_00064-of-00072.safetensors b/model_00064-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2c6000dd18044d418b8fb70c2cc54d72c5f930b3
--- /dev/null
+++ b/model_00064-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f819994ebb58a3e6504468f57f9a3c0e54d1f3aaecac3c460477dac2a96bdab0
+size 4932875543
diff --git a/model_00065-of-00072.safetensors b/model_00065-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d38db92c8943623a9e470f01c638188f1961aae2
--- /dev/null
+++ b/model_00065-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf02ef74d2a68edd7a683234669c6e2580de0f55349414033cd12666a91d2f67
+size 4932875543
diff --git a/model_00066-of-00072.safetensors b/model_00066-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..aaae06eb78ddfda60a7ed3dad37f1ae5800b492d
--- /dev/null
+++ b/model_00066-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94d4ba51fe5b4415a59cf7d88b604412bcd075dd6598d499b625730e07e140c3
+size 4932875543
diff --git a/model_00067-of-00072.safetensors b/model_00067-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d6d1c915efcc0bd2506531711d53cef1b46f39e5
--- /dev/null
+++ b/model_00067-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f8df4082e76d2efec5c522b3bae36026448fc7f5cf9a3924dd783ce19fe8f6a0
+size 4932875543
diff --git a/model_00068-of-00072.safetensors b/model_00068-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7e2aa2fe388a284b9324c5d0bb83463f89843133
--- /dev/null
+++ b/model_00068-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff3508f70a5040be6288e53327d93fb7f4b3956068d2441a47e14697bff1613b
+size 4932875543
diff --git a/model_00069-of-00072.safetensors b/model_00069-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..00e25a648670635cb1818b280223ee5f3f3590b8
--- /dev/null
+++ b/model_00069-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e681ce4abfd3845426a8538997eba33f45465e812e319d38feb016606c20f68
+size 4932875543
diff --git a/model_00070-of-00072.safetensors b/model_00070-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..983f96a113a641152b3d77dad85093f643c1df88
--- /dev/null
+++ b/model_00070-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f548ea5bb601fb88113068dc3118c63e247dcb10efd73e42f2d690695469cd9d
+size 4932875543
diff --git a/model_00071-of-00072.safetensors b/model_00071-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ee532f9029648aaa560778b30c7386ea3c491e57
--- /dev/null
+++ b/model_00071-of-00072.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6053926852f6726220d154581e20b7286d7cfe6912268bdbfcf49d4aa5b68b0a
+size 4932875543
diff --git a/model_00072-of-00072.safetensors b/model_00072-of-00072.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f8fb4c8f7a02ce97597a27329195ccc2c1128648
Binary files /dev/null and b/model_00072-of-00072.safetensors differ