esfrankel17
committed on
Commit
•
0b82567
1
Parent(s):
8ec2ca9
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:064843fdd202f923a17d6b23dfdd83bf1704b4dc40476dd0d973421c42ea4af6
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05e9af8806620d65be64b2c9555838a129c7b0310fcf44bedf667dd258c43fb2
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35bbf4a8a2627505f83d512bbeb6a96732e3e80aea4764c0e9a24df35cbc620e
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5593fa10ba8c2eaf4349e7420e4995d40981fc3177768c1e886ba8a4a2369e72
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -1,3 +1,5 @@
|
|
1 |
{"current_steps": 10, "total_steps": 48, "loss": 0.8943, "learning_rate": 5e-06, "epoch": 0.625, "percentage": 20.83, "elapsed_time": "0:05:23", "remaining_time": "0:20:28"}
|
2 |
{"current_steps": 16, "total_steps": 48, "eval_loss": 0.8237837553024292, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:08:43", "remaining_time": "0:17:27"}
|
3 |
{"current_steps": 20, "total_steps": 48, "loss": 0.7853, "learning_rate": 5e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:11:47", "remaining_time": "0:16:30"}
|
|
|
|
|
|
1 |
{"current_steps": 10, "total_steps": 48, "loss": 0.8943, "learning_rate": 5e-06, "epoch": 0.625, "percentage": 20.83, "elapsed_time": "0:05:23", "remaining_time": "0:20:28"}
|
2 |
{"current_steps": 16, "total_steps": 48, "eval_loss": 0.8237837553024292, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:08:43", "remaining_time": "0:17:27"}
|
3 |
{"current_steps": 20, "total_steps": 48, "loss": 0.7853, "learning_rate": 5e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:11:47", "remaining_time": "0:16:30"}
|
4 |
+
{"current_steps": 30, "total_steps": 48, "loss": 0.7293, "learning_rate": 5e-06, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:17:07", "remaining_time": "0:10:16"}
|
5 |
+
{"current_steps": 32, "total_steps": 48, "eval_loss": 0.7811707258224487, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:18:22", "remaining_time": "0:09:11"}
|