Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88d9853b50fedfd085a56b8b5c514828e632b3623fc1032220551e1e02f933e5
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cf86c6179a5a59d0018e7f3c1eefa8ebeda3cb3743a1104c9749e046b7c43fa
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d4bd59dfac413584c46ea6da76e22303f6710ada932795fa8637807f1441781
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13067522065f80d18728ddd25e1bcd6cee7e8ae73579daa5a64bdcb0e8351483
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -19,3 +19,19 @@
|
|
| 19 |
{"current_steps": 19, "total_steps": 48, "loss": 0.7302, "lr": 7.604701702439652e-06, "epoch": 1.1875, "percentage": 39.58, "elapsed_time": "0:10:05", "remaining_time": "0:15:24"}
|
| 20 |
{"current_steps": 20, "total_steps": 48, "loss": 0.8066, "lr": 7.286211616523193e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:10:32", "remaining_time": "0:14:45"}
|
| 21 |
{"current_steps": 21, "total_steps": 48, "loss": 0.7155, "lr": 6.95552360245078e-06, "epoch": 1.3125, "percentage": 43.75, "elapsed_time": "0:10:58", "remaining_time": "0:14:07"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 19 |
{"current_steps": 19, "total_steps": 48, "loss": 0.7302, "lr": 7.604701702439652e-06, "epoch": 1.1875, "percentage": 39.58, "elapsed_time": "0:10:05", "remaining_time": "0:15:24"}
|
| 20 |
{"current_steps": 20, "total_steps": 48, "loss": 0.8066, "lr": 7.286211616523193e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:10:32", "remaining_time": "0:14:45"}
|
| 21 |
{"current_steps": 21, "total_steps": 48, "loss": 0.7155, "lr": 6.95552360245078e-06, "epoch": 1.3125, "percentage": 43.75, "elapsed_time": "0:10:58", "remaining_time": "0:14:07"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 48, "loss": 0.7416, "lr": 6.614402023857231e-06, "epoch": 1.375, "percentage": 45.83, "elapsed_time": "0:11:27", "remaining_time": "0:13:32"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 48, "loss": 0.7355, "lr": 6.264666911958404e-06, "epoch": 1.4375, "percentage": 47.92, "elapsed_time": "0:12:00", "remaining_time": "0:13:02"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 48, "loss": 0.7514, "lr": 5.908184254897183e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "0:12:29", "remaining_time": "0:12:29"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 48, "loss": 0.7772, "lr": 5.546856041889374e-06, "epoch": 1.5625, "percentage": 52.08, "elapsed_time": "0:12:57", "remaining_time": "0:11:55"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 48, "loss": 0.7391, "lr": 5.182610115288296e-06, "epoch": 1.625, "percentage": 54.17, "elapsed_time": "0:13:23", "remaining_time": "0:11:19"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 48, "loss": 0.7486, "lr": 4.817389884711706e-06, "epoch": 1.6875, "percentage": 56.25, "elapsed_time": "0:13:54", "remaining_time": "0:10:49"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 48, "loss": 0.7909, "lr": 4.4531439581106295e-06, "epoch": 1.75, "percentage": 58.33, "elapsed_time": "0:14:25", "remaining_time": "0:10:18"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 48, "loss": 0.7535, "lr": 4.091815745102818e-06, "epoch": 1.8125, "percentage": 60.42, "elapsed_time": "0:14:51", "remaining_time": "0:09:44"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 48, "loss": 0.7276, "lr": 3.7353330880415963e-06, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:15:15", "remaining_time": "0:09:09"}
|
| 31 |
+
{"current_steps": 31, "total_steps": 48, "loss": 0.7982, "lr": 3.3855979761427705e-06, "epoch": 1.9375, "percentage": 64.58, "elapsed_time": "0:15:43", "remaining_time": "0:08:37"}
|
| 32 |
+
{"current_steps": 32, "total_steps": 48, "loss": 0.7689, "lr": 3.044476397549221e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:16:18", "remaining_time": "0:08:09"}
|
| 33 |
+
{"current_steps": 33, "total_steps": 48, "loss": 0.735, "lr": 2.7137883834768076e-06, "epoch": 2.0625, "percentage": 68.75, "elapsed_time": "0:17:38", "remaining_time": "0:08:01"}
|
| 34 |
+
{"current_steps": 34, "total_steps": 48, "loss": 0.772, "lr": 2.3952982975603494e-06, "epoch": 2.125, "percentage": 70.83, "elapsed_time": "0:18:03", "remaining_time": "0:07:26"}
|
| 35 |
+
{"current_steps": 35, "total_steps": 48, "loss": 0.7111, "lr": 2.0907054222102367e-06, "epoch": 2.1875, "percentage": 72.92, "elapsed_time": "0:18:41", "remaining_time": "0:06:56"}
|
| 36 |
+
{"current_steps": 36, "total_steps": 48, "loss": 0.6825, "lr": 1.8016348922055448e-06, "epoch": 2.25, "percentage": 75.0, "elapsed_time": "0:19:13", "remaining_time": "0:06:24"}
|
| 37 |
+
{"current_steps": 37, "total_steps": 48, "loss": 0.6869, "lr": 1.5296290238968303e-06, "epoch": 2.3125, "percentage": 77.08, "elapsed_time": "0:19:45", "remaining_time": "0:05:52"}
|