Training in progress, epoch 1

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ccc6562e39b1aef1f3c8393b76942e5217e02b25371469a934cfb2576505707
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:a1d3b6f1d26d70b32bd690ea723f7285630fc85fd9de61ff2e08e860b0b6bad1
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:99a792725e77604dc6393b772a2ee4bde9f08701908c4dd58f8b08f6607eedbf
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:80ffce1f241a0b536689d65dbcc7108256c00e973ec986af2321c53369120623
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3cfab223a4ddc4c74dadfaa08d160f23640a7a13ef06dd4ab5a1a907e45c0676
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:71aeaa957f88479af7c27b53efd60e2df95a117803180d6b77e51ace5f1fda91
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f66779a616603967f41d59f299b84b1ed4855b75ec52408439d54d1dd7ed656e
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:e107e1af5d4f759da5e1e45249a96f8bff5f48a9f386e4d6619d5397beacdae5
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -1,3 +1,7 @@
 {"current_steps": 10, "total_steps": 69, "loss": 1.0642, "lr": 5e-06, "epoch": 0.42328042328042326, "percentage": 14.49, "elapsed_time": "0:05:23", "remaining_time": "0:31:48"}
 {"current_steps": 20, "total_steps": 69, "loss": 0.9362, "lr": 5e-06, "epoch": 0.8465608465608465, "percentage": 28.99, "elapsed_time": "0:10:38", "remaining_time": "0:26:03"}
 {"current_steps": 23, "total_steps": 69, "eval_loss": 0.9042366743087769, "epoch": 0.9735449735449735, "percentage": 33.33, "elapsed_time": "0:12:42", "remaining_time": "0:25:24"}

 {"current_steps": 10, "total_steps": 69, "loss": 1.0642, "lr": 5e-06, "epoch": 0.42328042328042326, "percentage": 14.49, "elapsed_time": "0:05:23", "remaining_time": "0:31:48"}
 {"current_steps": 20, "total_steps": 69, "loss": 0.9362, "lr": 5e-06, "epoch": 0.8465608465608465, "percentage": 28.99, "elapsed_time": "0:10:38", "remaining_time": "0:26:03"}
 {"current_steps": 23, "total_steps": 69, "eval_loss": 0.9042366743087769, "epoch": 0.9735449735449735, "percentage": 33.33, "elapsed_time": "0:12:42", "remaining_time": "0:25:24"}
+{"current_steps": 30, "total_steps": 69, "loss": 0.9376, "lr": 5e-06, "epoch": 1.2804232804232805, "percentage": 43.48, "elapsed_time": "0:17:25", "remaining_time": "0:22:39"}
+{"current_steps": 40, "total_steps": 69, "loss": 0.8478, "lr": 5e-06, "epoch": 1.7037037037037037, "percentage": 57.97, "elapsed_time": "0:22:41", "remaining_time": "0:16:26"}
+{"current_steps": 46, "total_steps": 69, "eval_loss": 0.8493698835372925, "epoch": 1.9576719576719577, "percentage": 66.67, "elapsed_time": "0:26:26", "remaining_time": "0:13:13"}
+{"current_steps": 50, "total_steps": 69, "loss": 0.8658, "lr": 5e-06, "epoch": 2.1375661375661377, "percentage": 72.46, "elapsed_time": "0:29:30", "remaining_time": "0:11:12"}