Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1ec2e19611e728c2204c2059d4248158afe3c29ecf6f88fe26a7245923b632a
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:834c696f812bcdfc37396741c01533cdc2c1944ecf69a612765a1c37984846a5
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1bbb9a0dbf0e260efac2af325e4ce14e752b322852a0ed7eee2bc71af85fcc7
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70f2f1ba1b3f8e3646ba5ce8a6f21a7320e4e1104e94fc0ecfda28c3bb75bd5d
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -21,3 +21,11 @@
|
|
21 |
{"current_steps": 21, "total_steps": 30, "loss": 1.1522, "lr": 2.5000000000000015e-06, "epoch": 2.0, "percentage": 70.0, "elapsed_time": "0:19:51", "remaining_time": "0:08:30"}
|
22 |
{"current_steps": 22, "total_steps": 30, "loss": 0.7915, "lr": 2.0142070414860704e-06, "epoch": 2.0952380952380953, "percentage": 73.33, "elapsed_time": "0:21:33", "remaining_time": "0:07:50"}
|
23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.8528, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:22:33", "remaining_time": "0:06:52"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
21 |
{"current_steps": 21, "total_steps": 30, "loss": 1.1522, "lr": 2.5000000000000015e-06, "epoch": 2.0, "percentage": 70.0, "elapsed_time": "0:19:51", "remaining_time": "0:08:30"}
|
22 |
{"current_steps": 22, "total_steps": 30, "loss": 0.7915, "lr": 2.0142070414860704e-06, "epoch": 2.0952380952380953, "percentage": 73.33, "elapsed_time": "0:21:33", "remaining_time": "0:07:50"}
|
23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.8528, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:22:33", "remaining_time": "0:06:52"}
|
24 |
+
{"current_steps": 24, "total_steps": 30, "loss": 0.7936, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:23:29", "remaining_time": "0:05:52"}
|
25 |
+
{"current_steps": 25, "total_steps": 30, "loss": 0.7863, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:24:22", "remaining_time": "0:04:52"}
|
26 |
+
{"current_steps": 26, "total_steps": 30, "loss": 0.7732, "lr": 5.318367983829393e-07, "epoch": 2.4761904761904763, "percentage": 86.67, "elapsed_time": "0:25:09", "remaining_time": "0:03:52"}
|
27 |
+
{"current_steps": 27, "total_steps": 30, "loss": 0.7773, "lr": 3.015368960704584e-07, "epoch": 2.571428571428571, "percentage": 90.0, "elapsed_time": "0:25:59", "remaining_time": "0:02:53"}
|
28 |
+
{"current_steps": 28, "total_steps": 30, "loss": 0.8249, "lr": 1.3477564710088097e-07, "epoch": 2.6666666666666665, "percentage": 93.33, "elapsed_time": "0:27:00", "remaining_time": "0:01:55"}
|
29 |
+
{"current_steps": 29, "total_steps": 30, "loss": 0.7718, "lr": 3.3808211290284886e-08, "epoch": 2.761904761904762, "percentage": 96.67, "elapsed_time": "0:27:58", "remaining_time": "0:00:57"}
|
30 |
+
{"current_steps": 30, "total_steps": 30, "loss": 0.769, "lr": 0.0, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:28:50", "remaining_time": "0:00:00"}
|
31 |
+
{"current_steps": 30, "total_steps": 30, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:30:29", "remaining_time": "0:00:00"}
|