Training in progress, epoch 1

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4c7769dc968fbfe4c6430594fa2937fb10a1651a35b250ac35a0e928aafb925c
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:aac06ac3245c40add09c6b9ac5546cf12f2a11dab2b219df6b4883087c68e758
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c169681f94d906e79fc39e42397fda2436c48cfde94040beebaa956ffd5f4178
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:1101b5f347b71f407e76292444c4a5f9f54d84e91fecc380b1ceb00fb392e3b5
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9e641b74c9b89270891a37f86ae397ca2b2c2c68a8ab25deb2ace062a325cb22
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c29702af94b4100cb5cf273f3309918b982f8fa4c2e72b217526c1bb81b00e2
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:933b30d6692dc14502c7014498e882b80e48a5ce57cd090f4248173e341db53c
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:66e0f3cbf07530c22d4b75cba1444c47d089cf759bd4c7edba5e7eb20f445ff6
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -2,3 +2,7 @@
 {"current_steps": 20, "total_steps": 96, "loss": 0.6358, "lr": 5e-06, "epoch": 0.6106870229007634, "percentage": 20.83, "elapsed_time": "0:10:51", "remaining_time": "0:41:15"}
 {"current_steps": 30, "total_steps": 96, "loss": 0.5846, "lr": 5e-06, "epoch": 0.916030534351145, "percentage": 31.25, "elapsed_time": "0:16:12", "remaining_time": "0:35:40"}
 {"current_steps": 32, "total_steps": 96, "eval_loss": 0.5693601965904236, "epoch": 0.9770992366412213, "percentage": 33.33, "elapsed_time": "0:18:04", "remaining_time": "0:36:08"}

 {"current_steps": 20, "total_steps": 96, "loss": 0.6358, "lr": 5e-06, "epoch": 0.6106870229007634, "percentage": 20.83, "elapsed_time": "0:10:51", "remaining_time": "0:41:15"}
 {"current_steps": 30, "total_steps": 96, "loss": 0.5846, "lr": 5e-06, "epoch": 0.916030534351145, "percentage": 31.25, "elapsed_time": "0:16:12", "remaining_time": "0:35:40"}
 {"current_steps": 32, "total_steps": 96, "eval_loss": 0.5693601965904236, "epoch": 0.9770992366412213, "percentage": 33.33, "elapsed_time": "0:18:04", "remaining_time": "0:36:08"}
+{"current_steps": 40, "total_steps": 96, "loss": 0.5516, "lr": 5e-06, "epoch": 1.2213740458015268, "percentage": 41.67, "elapsed_time": "0:23:10", "remaining_time": "0:32:26"}
+{"current_steps": 50, "total_steps": 96, "loss": 0.5098, "lr": 5e-06, "epoch": 1.5267175572519083, "percentage": 52.08, "elapsed_time": "0:28:31", "remaining_time": "0:26:14"}
+{"current_steps": 60, "total_steps": 96, "loss": 0.4986, "lr": 5e-06, "epoch": 1.83206106870229, "percentage": 62.5, "elapsed_time": "0:33:52", "remaining_time": "0:20:19"}
+{"current_steps": 65, "total_steps": 96, "eval_loss": 0.5270054340362549, "epoch": 1.984732824427481, "percentage": 67.71, "elapsed_time": "0:37:06", "remaining_time": "0:17:41"}