Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bafc57fcaa812d63cc1e3c128e986d0c3ff8659a168d20769bdb06af7ec9ecf0
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30c4873be68ffc42d232a9939b1804d465585089803fcd8c878843ea0a674b5b
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ce62bbcb44cac955a29e1f654a6a28877d3c539b31349933a7e7313126125cb
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67bec0fe378744916e9791f8b17f5743519b45aaad4cfc787eda4fe433ebaf37
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -8,3 +8,9 @@
|
|
8 |
{"current_steps": 70, "total_steps": 123, "loss": 0.7662, "lr": 5e-06, "epoch": 1.6816816816816815, "percentage": 56.91, "elapsed_time": "0:38:48", "remaining_time": "0:29:23"}
|
9 |
{"current_steps": 80, "total_steps": 123, "loss": 0.7594, "lr": 5e-06, "epoch": 1.921921921921922, "percentage": 65.04, "elapsed_time": "0:44:04", "remaining_time": "0:23:41"}
|
10 |
{"current_steps": 83, "total_steps": 123, "eval_loss": 0.777886688709259, "epoch": 1.993993993993994, "percentage": 67.48, "elapsed_time": "0:46:10", "remaining_time": "0:22:15"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
{"current_steps": 70, "total_steps": 123, "loss": 0.7662, "lr": 5e-06, "epoch": 1.6816816816816815, "percentage": 56.91, "elapsed_time": "0:38:48", "remaining_time": "0:29:23"}
|
9 |
{"current_steps": 80, "total_steps": 123, "loss": 0.7594, "lr": 5e-06, "epoch": 1.921921921921922, "percentage": 65.04, "elapsed_time": "0:44:04", "remaining_time": "0:23:41"}
|
10 |
{"current_steps": 83, "total_steps": 123, "eval_loss": 0.777886688709259, "epoch": 1.993993993993994, "percentage": 67.48, "elapsed_time": "0:46:10", "remaining_time": "0:22:15"}
|
11 |
+
{"current_steps": 90, "total_steps": 123, "loss": 0.755, "lr": 5e-06, "epoch": 2.1621621621621623, "percentage": 73.17, "elapsed_time": "0:51:02", "remaining_time": "0:18:42"}
|
12 |
+
{"current_steps": 100, "total_steps": 123, "loss": 0.7095, "lr": 5e-06, "epoch": 2.4024024024024024, "percentage": 81.3, "elapsed_time": "0:56:18", "remaining_time": "0:12:57"}
|
13 |
+
{"current_steps": 110, "total_steps": 123, "loss": 0.7074, "lr": 5e-06, "epoch": 2.6426426426426426, "percentage": 89.43, "elapsed_time": "1:01:33", "remaining_time": "0:07:16"}
|
14 |
+
{"current_steps": 120, "total_steps": 123, "loss": 0.7082, "lr": 5e-06, "epoch": 2.8828828828828827, "percentage": 97.56, "elapsed_time": "1:06:51", "remaining_time": "0:01:40"}
|
15 |
+
{"current_steps": 123, "total_steps": 123, "eval_loss": 0.7722160816192627, "epoch": 2.954954954954955, "percentage": 100.0, "elapsed_time": "1:10:13", "remaining_time": "0:00:00"}
|
16 |
+
{"current_steps": 123, "total_steps": 123, "epoch": 2.954954954954955, "percentage": 100.0, "elapsed_time": "1:11:26", "remaining_time": "0:00:00"}
|