Training in progress, step 10, checkpoint

Files changed (6) hide show

checkpoint-10/adapter_config.json CHANGED Viewed

@@ -20,8 +20,8 @@
   "revision": null,
   "target_modules": [
     "q_proj",
-    "o_proj",
     "k_proj",
     "v_proj"
   ],
   "task_type": "CAUSAL_LM",

   "revision": null,
   "target_modules": [
     "q_proj",
     "k_proj",
+    "o_proj",
     "v_proj"
   ],
   "task_type": "CAUSAL_LM",

checkpoint-10/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9816cbecf0d2326a067711f94d8fdace56f34b21cae6bea2a64a94672f5a0b6b
 size 27297032

 version https://git-lfs.github.com/spec/v1
+oid sha256:ad7edadd0173530939f388f4b5aeca9bb6ff6d497bbf0605833181cd4db3832d
 size 27297032

checkpoint-10/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:25be627d618d98b88877924ebae77b453f80db9721ded44ce246cf586a1090c6
 size 54678010

 version https://git-lfs.github.com/spec/v1
+oid sha256:78174670b788b2cafec59ee3c5966333c6b8f8c2a4aad0a13fcbd4829fed7796
 size 54678010

checkpoint-10/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e682acd73b606b0f2659ad0f4f8d6e222db7f6b19c61dc2d69ab911f43a9c001
 size 14512

 version https://git-lfs.github.com/spec/v1
+oid sha256:42d83b94c8ac5fc9478b91d2426ff1842349919562d432c6c2618e3dc7fdc544
 size 14512

checkpoint-10/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 1.3349500894546509,
   "best_model_checkpoint": "./mistral/29-02-24-Weni-testing_saving_checkpoints-final_Zeroshot-2_max_steps-60_batch_8_2024-02-29_ppid_7/checkpoint-10",
   "epoch": 0.006199628022318661,
   "eval_steps": 10,
@@ -10,10 +10,10 @@
   "log_history": [
     {
       "epoch": 0.01,
-      "eval_loss": 1.3349500894546509,
-      "eval_runtime": 212.0568,
-      "eval_samples_per_second": 13.52,
-      "eval_steps_per_second": 3.381,
       "step": 10
     }
   ],
@@ -22,7 +22,7 @@
   "num_input_tokens_seen": 0,
   "num_train_epochs": 1,
   "save_steps": 10,
-  "total_flos": 5222974437195776.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 1.353695273399353,
   "best_model_checkpoint": "./mistral/29-02-24-Weni-testing_saving_checkpoints-final_Zeroshot-2_max_steps-60_batch_8_2024-02-29_ppid_7/checkpoint-10",
   "epoch": 0.006199628022318661,
   "eval_steps": 10,
   "log_history": [
     {
       "epoch": 0.01,
+      "eval_loss": 1.353695273399353,
+      "eval_runtime": 211.2183,
+      "eval_samples_per_second": 13.574,
+      "eval_steps_per_second": 3.395,
       "step": 10
     }
   ],
   "num_input_tokens_seen": 0,
   "num_train_epochs": 1,
   "save_steps": 10,
+  "total_flos": 4887826864799744.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

checkpoint-10/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:09451dd342dbcd48b4952803853b975a8bd13b7e94555d226899f1b4fa2438b7
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:a8e1a7d78795fa69fe8e3bb1a18304b885d78d38897e6462ed8a482e70228ab3
 size 5112