sedrickkeh
commited on
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5fd034415dfc6174fb8a167a43c022e2da909b987cf83050b3ff6464beeb866
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b56f755c8ae56fdfb10c2e371b124f4eff899abee9ea1ccc89f29b865335b214
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1f6bf3e71a4d75448e4dd27eba070970047cc1a108bdd1962f45b96c98c5732
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8386986c7bd233d6ff3486c0f217b979077162e102ea2ee3d36f5e60aa6be505
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -38,3 +38,22 @@
|
|
38 |
{"current_steps": 370, "total_steps": 576, "loss": 0.4969, "lr": 5e-06, "epoch": 1.9233268356075373, "percentage": 64.24, "elapsed_time": "3:21:07", "remaining_time": "1:51:58"}
|
39 |
{"current_steps": 380, "total_steps": 576, "loss": 0.5116, "lr": 5e-06, "epoch": 1.9753086419753085, "percentage": 65.97, "elapsed_time": "3:26:28", "remaining_time": "1:46:29"}
|
40 |
{"current_steps": 384, "total_steps": 576, "eval_loss": 0.5507273077964783, "epoch": 1.996101364522417, "percentage": 66.67, "elapsed_time": "3:31:09", "remaining_time": "1:45:34"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
38 |
{"current_steps": 370, "total_steps": 576, "loss": 0.4969, "lr": 5e-06, "epoch": 1.9233268356075373, "percentage": 64.24, "elapsed_time": "3:21:07", "remaining_time": "1:51:58"}
|
39 |
{"current_steps": 380, "total_steps": 576, "loss": 0.5116, "lr": 5e-06, "epoch": 1.9753086419753085, "percentage": 65.97, "elapsed_time": "3:26:28", "remaining_time": "1:46:29"}
|
40 |
{"current_steps": 384, "total_steps": 576, "eval_loss": 0.5507273077964783, "epoch": 1.996101364522417, "percentage": 66.67, "elapsed_time": "3:31:09", "remaining_time": "1:45:34"}
|
41 |
+
{"current_steps": 390, "total_steps": 576, "loss": 0.5155, "lr": 5e-06, "epoch": 2.02729044834308, "percentage": 67.71, "elapsed_time": "3:35:19", "remaining_time": "1:42:41"}
|
42 |
+
{"current_steps": 400, "total_steps": 576, "loss": 0.4578, "lr": 5e-06, "epoch": 2.079272254710851, "percentage": 69.44, "elapsed_time": "3:40:41", "remaining_time": "1:37:06"}
|
43 |
+
{"current_steps": 410, "total_steps": 576, "loss": 0.4704, "lr": 5e-06, "epoch": 2.1312540610786224, "percentage": 71.18, "elapsed_time": "3:46:04", "remaining_time": "1:31:31"}
|
44 |
+
{"current_steps": 420, "total_steps": 576, "loss": 0.4637, "lr": 5e-06, "epoch": 2.1832358674463936, "percentage": 72.92, "elapsed_time": "3:51:25", "remaining_time": "1:25:57"}
|
45 |
+
{"current_steps": 430, "total_steps": 576, "loss": 0.4622, "lr": 5e-06, "epoch": 2.235217673814165, "percentage": 74.65, "elapsed_time": "3:56:45", "remaining_time": "1:20:23"}
|
46 |
+
{"current_steps": 440, "total_steps": 576, "loss": 0.4607, "lr": 5e-06, "epoch": 2.287199480181936, "percentage": 76.39, "elapsed_time": "4:02:05", "remaining_time": "1:14:49"}
|
47 |
+
{"current_steps": 450, "total_steps": 576, "loss": 0.4622, "lr": 5e-06, "epoch": 2.3391812865497075, "percentage": 78.12, "elapsed_time": "4:07:26", "remaining_time": "1:09:17"}
|
48 |
+
{"current_steps": 460, "total_steps": 576, "loss": 0.4682, "lr": 5e-06, "epoch": 2.3911630929174787, "percentage": 79.86, "elapsed_time": "4:12:49", "remaining_time": "1:03:45"}
|
49 |
+
{"current_steps": 470, "total_steps": 576, "loss": 0.4594, "lr": 5e-06, "epoch": 2.44314489928525, "percentage": 81.6, "elapsed_time": "4:18:11", "remaining_time": "0:58:13"}
|
50 |
+
{"current_steps": 480, "total_steps": 576, "loss": 0.4675, "lr": 5e-06, "epoch": 2.4951267056530213, "percentage": 83.33, "elapsed_time": "4:23:33", "remaining_time": "0:52:42"}
|
51 |
+
{"current_steps": 490, "total_steps": 576, "loss": 0.4659, "lr": 5e-06, "epoch": 2.5471085120207926, "percentage": 85.07, "elapsed_time": "4:28:55", "remaining_time": "0:47:11"}
|
52 |
+
{"current_steps": 500, "total_steps": 576, "loss": 0.4588, "lr": 5e-06, "epoch": 2.599090318388564, "percentage": 86.81, "elapsed_time": "4:34:18", "remaining_time": "0:41:41"}
|
53 |
+
{"current_steps": 510, "total_steps": 576, "loss": 0.4634, "lr": 5e-06, "epoch": 2.651072124756335, "percentage": 88.54, "elapsed_time": "4:39:40", "remaining_time": "0:36:11"}
|
54 |
+
{"current_steps": 520, "total_steps": 576, "loss": 0.4642, "lr": 5e-06, "epoch": 2.7030539311241064, "percentage": 90.28, "elapsed_time": "4:45:01", "remaining_time": "0:30:41"}
|
55 |
+
{"current_steps": 530, "total_steps": 576, "loss": 0.4658, "lr": 5e-06, "epoch": 2.7550357374918777, "percentage": 92.01, "elapsed_time": "4:50:21", "remaining_time": "0:25:12"}
|
56 |
+
{"current_steps": 540, "total_steps": 576, "loss": 0.4712, "lr": 5e-06, "epoch": 2.807017543859649, "percentage": 93.75, "elapsed_time": "4:55:42", "remaining_time": "0:19:42"}
|
57 |
+
{"current_steps": 550, "total_steps": 576, "loss": 0.4672, "lr": 5e-06, "epoch": 2.8589993502274202, "percentage": 95.49, "elapsed_time": "5:01:04", "remaining_time": "0:14:13"}
|
58 |
+
{"current_steps": 560, "total_steps": 576, "loss": 0.4682, "lr": 5e-06, "epoch": 2.9109811565951915, "percentage": 97.22, "elapsed_time": "5:06:27", "remaining_time": "0:08:45"}
|
59 |
+
{"current_steps": 570, "total_steps": 576, "loss": 0.4569, "lr": 5e-06, "epoch": 2.962962962962963, "percentage": 98.96, "elapsed_time": "5:11:49", "remaining_time": "0:03:16"}
|