Training in progress, epoch 10
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8adb849e534d02252f56026aaad372f512702c584d434f81bdd42b7135635792
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3798f4231d887ff09e263bd8dedbceb0e03ca2fe407d93dcaa4140ad56c9204
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7ee46fd9e5e360aa1c588f43de99e40475db2ab0eb42de93970422707776603
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4ebdfedcba7ec92e3374ed71b75213ff9c017f4250a87e9dc1ba513a5217c3f
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -100,3 +100,13 @@
|
|
| 100 |
{"current_steps": 100, "total_steps": 117, "loss": 0.1969, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "0:52:01", "remaining_time": "0:08:50"}
|
| 101 |
{"current_steps": 101, "total_steps": 117, "loss": 0.0823, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "0:52:19", "remaining_time": "0:08:17"}
|
| 102 |
{"current_steps": 102, "total_steps": 117, "loss": 0.0915, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:52:42", "remaining_time": "0:07:45"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 100 |
{"current_steps": 100, "total_steps": 117, "loss": 0.1969, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "0:52:01", "remaining_time": "0:08:50"}
|
| 101 |
{"current_steps": 101, "total_steps": 117, "loss": 0.0823, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "0:52:19", "remaining_time": "0:08:17"}
|
| 102 |
{"current_steps": 102, "total_steps": 117, "loss": 0.0915, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:52:42", "remaining_time": "0:07:45"}
|
| 103 |
+
{"current_steps": 103, "total_steps": 117, "loss": 0.1517, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:53:11", "remaining_time": "0:07:13"}
|
| 104 |
+
{"current_steps": 104, "total_steps": 117, "loss": 0.1393, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "0:53:40", "remaining_time": "0:06:42"}
|
| 105 |
+
{"current_steps": 105, "total_steps": 117, "loss": 0.1027, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "0:55:00", "remaining_time": "0:06:17"}
|
| 106 |
+
{"current_steps": 106, "total_steps": 117, "loss": 0.1036, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "0:55:27", "remaining_time": "0:05:45"}
|
| 107 |
+
{"current_steps": 107, "total_steps": 117, "loss": 0.1259, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "0:55:50", "remaining_time": "0:05:13"}
|
| 108 |
+
{"current_steps": 108, "total_steps": 117, "loss": 0.0926, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "0:56:08", "remaining_time": "0:04:40"}
|
| 109 |
+
{"current_steps": 109, "total_steps": 117, "loss": 0.1267, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "0:56:31", "remaining_time": "0:04:08"}
|
| 110 |
+
{"current_steps": 110, "total_steps": 117, "loss": 0.1769, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "0:57:03", "remaining_time": "0:03:37"}
|
| 111 |
+
{"current_steps": 111, "total_steps": 117, "loss": 0.1202, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "0:57:30", "remaining_time": "0:03:06"}
|
| 112 |
+
{"current_steps": 112, "total_steps": 117, "loss": 0.1135, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "0:57:52", "remaining_time": "0:02:35"}
|