Training in progress, epoch 1

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1a672655c00e411f8a6b77168ea274acd442e2e57c27f37c46a283d390cd557
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:c411998f5aa13b167b4169ea6693741dc84d7361c709b2bb63913c2c63899bc0
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:09f98d46a633dc0111f3bf3fd42d048e9371331a5a1256f8e7bdac6edd1d253a
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:f2816be7f943abf8c7a9a381acb1547de648e60fa475348847826d79da4c60aa
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a69bd72ae63557f31959f2b43f72f3491c1992d00a95afa721893942ceff1638
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:82d564947c65b123ef63cb7a39cb143934bf4c4ca0f50d209ba1b0033d8d9e02
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5952e3a690e18b99a1acf735d38fd2084142fdaced8db9b642baa7a94def9c85
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:87eae362bfd33a24c49a6d745e6d16c1d922e9186fbd9b8f5381ed8432d87453
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -3,3 +3,7 @@
 {"current_steps": 30, "total_steps": 114, "loss": 1.0172, "lr": 5e-06, "epoch": 0.7704654895666132, "percentage": 26.32, "elapsed_time": "1:17:59", "remaining_time": "3:38:21"}
 {"current_steps": 38, "total_steps": 114, "eval_loss": 0.996041476726532, "epoch": 0.9759229534510433, "percentage": 33.33, "elapsed_time": "1:43:11", "remaining_time": "3:26:22"}
 {"current_steps": 40, "total_steps": 114, "loss": 0.9942, "lr": 5e-06, "epoch": 1.0272873194221508, "percentage": 35.09, "elapsed_time": "1:47:21", "remaining_time": "3:18:36"}

 {"current_steps": 30, "total_steps": 114, "loss": 1.0172, "lr": 5e-06, "epoch": 0.7704654895666132, "percentage": 26.32, "elapsed_time": "1:17:59", "remaining_time": "3:38:21"}
 {"current_steps": 38, "total_steps": 114, "eval_loss": 0.996041476726532, "epoch": 0.9759229534510433, "percentage": 33.33, "elapsed_time": "1:43:11", "remaining_time": "3:26:22"}
 {"current_steps": 40, "total_steps": 114, "loss": 0.9942, "lr": 5e-06, "epoch": 1.0272873194221508, "percentage": 35.09, "elapsed_time": "1:47:21", "remaining_time": "3:18:36"}
+{"current_steps": 50, "total_steps": 114, "loss": 0.9489, "lr": 5e-06, "epoch": 1.2841091492776886, "percentage": 43.86, "elapsed_time": "2:13:17", "remaining_time": "2:50:37"}
+{"current_steps": 60, "total_steps": 114, "loss": 0.9348, "lr": 5e-06, "epoch": 1.5409309791332264, "percentage": 52.63, "elapsed_time": "2:39:13", "remaining_time": "2:23:18"}
+{"current_steps": 70, "total_steps": 114, "loss": 0.9304, "lr": 5e-06, "epoch": 1.797752808988764, "percentage": 61.4, "elapsed_time": "3:05:10", "remaining_time": "1:56:23"}
+{"current_steps": 77, "total_steps": 114, "eval_loss": 0.9520364999771118, "epoch": 1.9775280898876404, "percentage": 67.54, "elapsed_time": "3:27:36", "remaining_time": "1:39:45"}