Training in progress, step 110

Files changed (10) hide show

adapter_config.json CHANGED Viewed

@@ -29,13 +29,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
-    "down_proj",
     "up_proj",
-    "o_proj",
     "gate_proj",
-    "k_proj",
-    "v_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "o_proj",
+    "v_proj",
+    "k_proj",
     "q_proj",
     "up_proj",
     "gate_proj",
+    "down_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:60d95b10b6e140a9626a7058d5038528f2ff80148dc4569b881db56052046509
-size 40

 version https://git-lfs.github.com/spec/v1
+oid sha256:c4d4268fbced7e166240d2fd404e3dca36a791adfefec718d3067887406b39a8
+size 335605144

config.json CHANGED Viewed

@@ -18,6 +18,7 @@
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": {

   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
+  "pad_token_id": 128001,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": {

generation_config.json CHANGED Viewed

@@ -2,7 +2,10 @@
   "_from_model_config": true,
   "bos_token_id": 128000,
   "do_sample": true,
-  "eos_token_id": 128001,
   "temperature": 0.6,
   "top_p": 0.95,
   "transformers_version": "4.57.1"

   "_from_model_config": true,
   "bos_token_id": 128000,
   "do_sample": true,
+  "eos_token_id": [
+    128001
+  ],
+  "pad_token_id": 128001,
   "temperature": 0.6,
   "top_p": 0.95,
   "transformers_version": "4.57.1"

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:00a90f92cc5605b61a0073398c7225385e2d035612aca045b9d71240bfb77849
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e2f1874281ef5e5f9c9fc1ec19710d47fe40bf7058ea969134658f8d1686463
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68438e6709775ab0e8e322a60ae80ebd1f131a378bc2aa7f1e831ef147422ef2
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e35564ec1b452ecd3eb081a514ccd022ec8af23a9231644fed0d1456fa71fa8
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40666efae41cbd67e18ba3620ac5caf3a61e7b666862ae014c99ff94c38d5154
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:7bb86752df561fbf75077a016cb99761d06176ac60dcdd0f82fc1c47979503a2
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc6192f16067485b8e90111208f423ba9a2c323053d4792dc50e20f7a99b816e
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e089bac37bd76643d34de725e54ba059c6e05312d087d3d68798fa7d49fb6af
 size 1168138808

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d91915040cfac999d8c55f4b5bc6e67367c065e3a7a4e4b9438ce1f256addd86
-size 17209530

 version https://git-lfs.github.com/spec/v1
+oid sha256:26c881aaf4ef935b1516ec79ad6405dd2a459f2b5d431a8a4a1399c92f3ba022
+size 17209711

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0de2821aab93454e4a327821e4e141f31c7342c176f9e11dfa2b4d0afd1130e8
 size 8760

 version https://git-lfs.github.com/spec/v1
+oid sha256:87f504b40016b12c079540469b81ed1e8baa9535c9cd14bb840a8ed722825f4a
 size 8760