Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d3b6f1d26d70b32bd690ea723f7285630fc85fd9de61ff2e08e860b0b6bad1
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80ffce1f241a0b536689d65dbcc7108256c00e973ec986af2321c53369120623
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71aeaa957f88479af7c27b53efd60e2df95a117803180d6b77e51ace5f1fda91
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e107e1af5d4f759da5e1e45249a96f8bff5f48a9f386e4d6619d5397beacdae5
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -1,3 +1,7 @@
|
|
1 |
{"current_steps": 10, "total_steps": 69, "loss": 1.0642, "lr": 5e-06, "epoch": 0.42328042328042326, "percentage": 14.49, "elapsed_time": "0:05:23", "remaining_time": "0:31:48"}
|
2 |
{"current_steps": 20, "total_steps": 69, "loss": 0.9362, "lr": 5e-06, "epoch": 0.8465608465608465, "percentage": 28.99, "elapsed_time": "0:10:38", "remaining_time": "0:26:03"}
|
3 |
{"current_steps": 23, "total_steps": 69, "eval_loss": 0.9042366743087769, "epoch": 0.9735449735449735, "percentage": 33.33, "elapsed_time": "0:12:42", "remaining_time": "0:25:24"}
|
|
|
|
|
|
|
|
|
|
1 |
{"current_steps": 10, "total_steps": 69, "loss": 1.0642, "lr": 5e-06, "epoch": 0.42328042328042326, "percentage": 14.49, "elapsed_time": "0:05:23", "remaining_time": "0:31:48"}
|
2 |
{"current_steps": 20, "total_steps": 69, "loss": 0.9362, "lr": 5e-06, "epoch": 0.8465608465608465, "percentage": 28.99, "elapsed_time": "0:10:38", "remaining_time": "0:26:03"}
|
3 |
{"current_steps": 23, "total_steps": 69, "eval_loss": 0.9042366743087769, "epoch": 0.9735449735449735, "percentage": 33.33, "elapsed_time": "0:12:42", "remaining_time": "0:25:24"}
|
4 |
+
{"current_steps": 30, "total_steps": 69, "loss": 0.9376, "lr": 5e-06, "epoch": 1.2804232804232805, "percentage": 43.48, "elapsed_time": "0:17:25", "remaining_time": "0:22:39"}
|
5 |
+
{"current_steps": 40, "total_steps": 69, "loss": 0.8478, "lr": 5e-06, "epoch": 1.7037037037037037, "percentage": 57.97, "elapsed_time": "0:22:41", "remaining_time": "0:16:26"}
|
6 |
+
{"current_steps": 46, "total_steps": 69, "eval_loss": 0.8493698835372925, "epoch": 1.9576719576719577, "percentage": 66.67, "elapsed_time": "0:26:26", "remaining_time": "0:13:13"}
|
7 |
+
{"current_steps": 50, "total_steps": 69, "loss": 0.8658, "lr": 5e-06, "epoch": 2.1375661375661377, "percentage": 72.46, "elapsed_time": "0:29:30", "remaining_time": "0:11:12"}
|