Training in progress, epoch 10
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:702212b10cc463d924e99c70e9f4f9df3bdfca009b4293ff5cbc3fca27ebc13b
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e383e72af5f3daad0e914e987f58f24a6e079f0bf1eaf42cc25ae8eb40a0bc7
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ec2172fb389f7d6d0f1fbe2aedcea91347b4e8076e822b3719792f6ac065777
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27e49ecfebf15c5b00e35e9871ab0b3493b5fa19ca83ff50ed6c15fec7256c6b
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -102,3 +102,13 @@
|
|
| 102 |
{"current_steps": 102, "total_steps": 117, "loss": 0.0845, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:40:44", "remaining_time": "0:05:59"}
|
| 103 |
{"current_steps": 103, "total_steps": 117, "loss": 0.0676, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:41:02", "remaining_time": "0:05:34"}
|
| 104 |
{"current_steps": 104, "total_steps": 117, "loss": 0.0592, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "0:41:19", "remaining_time": "0:05:09"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 102 |
{"current_steps": 102, "total_steps": 117, "loss": 0.0845, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:40:44", "remaining_time": "0:05:59"}
|
| 103 |
{"current_steps": 103, "total_steps": 117, "loss": 0.0676, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:41:02", "remaining_time": "0:05:34"}
|
| 104 |
{"current_steps": 104, "total_steps": 117, "loss": 0.0592, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "0:41:19", "remaining_time": "0:05:09"}
|
| 105 |
+
{"current_steps": 105, "total_steps": 117, "loss": 0.0593, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "0:42:28", "remaining_time": "0:04:51"}
|
| 106 |
+
{"current_steps": 106, "total_steps": 117, "loss": 0.0818, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "0:42:49", "remaining_time": "0:04:26"}
|
| 107 |
+
{"current_steps": 107, "total_steps": 117, "loss": 0.0502, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "0:43:01", "remaining_time": "0:04:01"}
|
| 108 |
+
{"current_steps": 108, "total_steps": 117, "loss": 0.0626, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "0:43:15", "remaining_time": "0:03:36"}
|
| 109 |
+
{"current_steps": 109, "total_steps": 117, "loss": 0.0793, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "0:43:37", "remaining_time": "0:03:12"}
|
| 110 |
+
{"current_steps": 110, "total_steps": 117, "loss": 0.0735, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "0:43:53", "remaining_time": "0:02:47"}
|
| 111 |
+
{"current_steps": 111, "total_steps": 117, "loss": 0.0961, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "0:44:15", "remaining_time": "0:02:23"}
|
| 112 |
+
{"current_steps": 112, "total_steps": 117, "loss": 0.067, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "0:44:33", "remaining_time": "0:01:59"}
|
| 113 |
+
{"current_steps": 113, "total_steps": 117, "loss": 0.0847, "lr": 3.576536829081323e-08, "epoch": 11.860759493670885, "percentage": 96.58, "elapsed_time": "0:44:56", "remaining_time": "0:01:35"}
|
| 114 |
+
{"current_steps": 114, "total_steps": 117, "loss": 0.0645, "lr": 2.012853002380466e-08, "epoch": 11.962025316455696, "percentage": 97.44, "elapsed_time": "0:45:13", "remaining_time": "0:01:11"}
|