Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aac06ac3245c40add09c6b9ac5546cf12f2a11dab2b219df6b4883087c68e758
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1101b5f347b71f407e76292444c4a5f9f54d84e91fecc380b1ceb00fb392e3b5
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c29702af94b4100cb5cf273f3309918b982f8fa4c2e72b217526c1bb81b00e2
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66e0f3cbf07530c22d4b75cba1444c47d089cf759bd4c7edba5e7eb20f445ff6
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,7 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 96, "loss": 0.6358, "lr": 5e-06, "epoch": 0.6106870229007634, "percentage": 20.83, "elapsed_time": "0:10:51", "remaining_time": "0:41:15"}
|
| 3 |
{"current_steps": 30, "total_steps": 96, "loss": 0.5846, "lr": 5e-06, "epoch": 0.916030534351145, "percentage": 31.25, "elapsed_time": "0:16:12", "remaining_time": "0:35:40"}
|
| 4 |
{"current_steps": 32, "total_steps": 96, "eval_loss": 0.5693601965904236, "epoch": 0.9770992366412213, "percentage": 33.33, "elapsed_time": "0:18:04", "remaining_time": "0:36:08"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 96, "loss": 0.6358, "lr": 5e-06, "epoch": 0.6106870229007634, "percentage": 20.83, "elapsed_time": "0:10:51", "remaining_time": "0:41:15"}
|
| 3 |
{"current_steps": 30, "total_steps": 96, "loss": 0.5846, "lr": 5e-06, "epoch": 0.916030534351145, "percentage": 31.25, "elapsed_time": "0:16:12", "remaining_time": "0:35:40"}
|
| 4 |
{"current_steps": 32, "total_steps": 96, "eval_loss": 0.5693601965904236, "epoch": 0.9770992366412213, "percentage": 33.33, "elapsed_time": "0:18:04", "remaining_time": "0:36:08"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 96, "loss": 0.5516, "lr": 5e-06, "epoch": 1.2213740458015268, "percentage": 41.67, "elapsed_time": "0:23:10", "remaining_time": "0:32:26"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 96, "loss": 0.5098, "lr": 5e-06, "epoch": 1.5267175572519083, "percentage": 52.08, "elapsed_time": "0:28:31", "remaining_time": "0:26:14"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 96, "loss": 0.4986, "lr": 5e-06, "epoch": 1.83206106870229, "percentage": 62.5, "elapsed_time": "0:33:52", "remaining_time": "0:20:19"}
|
| 8 |
+
{"current_steps": 65, "total_steps": 96, "eval_loss": 0.5270054340362549, "epoch": 1.984732824427481, "percentage": 67.71, "elapsed_time": "0:37:06", "remaining_time": "0:17:41"}
|