sedrickkeh
committed on
Commit
•
d44228b
1
Parent(s):
2dcb519
Training in progress, epoch 3
Browse files
model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943162336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0ea6043cebfee3301f84b0329d5b6008cee00e17a2118c245f297796a01f362
|
3 |
size 4943162336
|
model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:821ebfbe647374371a089bc87008cf9f065d4e66cf63d76466fcc037b4687c01
|
3 |
size 4999819336
|
model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4540516344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:156a99fdce4affcf667c8a879a2d04e3f199b3b4c5e15cfdd6617349ed401725
|
3 |
size 4540516344
|
trainer_log.jsonl
CHANGED
@@ -33,3 +33,20 @@
|
|
33 |
{"current_steps": 320, "total_steps": 504, "loss": 0.4338, "lr": 1.9539255805556346e-06, "epoch": 1.9047619047619047, "percentage": 63.49, "elapsed_time": "5:11:56", "remaining_time": "2:59:22"}
|
34 |
{"current_steps": 330, "total_steps": 504, "loss": 0.4333, "lr": 1.7764836446824835e-06, "epoch": 1.9642857142857144, "percentage": 65.48, "elapsed_time": "5:21:34", "remaining_time": "2:49:33"}
|
35 |
{"current_steps": 336, "total_steps": 504, "eval_loss": 0.05795557424426079, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "5:30:16", "remaining_time": "2:45:08"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
{"current_steps": 320, "total_steps": 504, "loss": 0.4338, "lr": 1.9539255805556346e-06, "epoch": 1.9047619047619047, "percentage": 63.49, "elapsed_time": "5:11:56", "remaining_time": "2:59:22"}
|
34 |
{"current_steps": 330, "total_steps": 504, "loss": 0.4333, "lr": 1.7764836446824835e-06, "epoch": 1.9642857142857144, "percentage": 65.48, "elapsed_time": "5:21:34", "remaining_time": "2:49:33"}
|
35 |
{"current_steps": 336, "total_steps": 504, "eval_loss": 0.05795557424426079, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "5:30:16", "remaining_time": "2:45:08"}
|
36 |
+
{"current_steps": 340, "total_steps": 504, "loss": 0.414, "lr": 1.6029381269821607e-06, "epoch": 2.0238095238095237, "percentage": 67.46, "elapsed_time": "5:34:54", "remaining_time": "2:41:32"}
|
37 |
+
{"current_steps": 350, "total_steps": 504, "loss": 0.3888, "lr": 1.4342236378529106e-06, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "5:44:32", "remaining_time": "2:31:35"}
|
38 |
+
{"current_steps": 360, "total_steps": 504, "loss": 0.3841, "lr": 1.2712487707171645e-06, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "5:54:10", "remaining_time": "2:21:40"}
|
39 |
+
{"current_steps": 370, "total_steps": 504, "loss": 0.3837, "lr": 1.1148912088910687e-06, "epoch": 2.2023809523809526, "percentage": 73.41, "elapsed_time": "6:03:47", "remaining_time": "2:11:45"}
|
40 |
+
{"current_steps": 380, "total_steps": 504, "loss": 0.3863, "lr": 9.659929989170156e-07, "epoch": 2.261904761904762, "percentage": 75.4, "elapsed_time": "6:13:25", "remaining_time": "2:01:51"}
|
41 |
+
{"current_steps": 390, "total_steps": 504, "loss": 0.3825, "lr": 8.253560158141111e-07, "epoch": 2.3214285714285716, "percentage": 77.38, "elapsed_time": "6:23:02", "remaining_time": "1:51:58"}
|
42 |
+
{"current_steps": 400, "total_steps": 504, "loss": 0.3817, "lr": 6.93737644667995e-07, "epoch": 2.380952380952381, "percentage": 79.37, "elapsed_time": "6:32:40", "remaining_time": "1:42:05"}
|
43 |
+
{"current_steps": 410, "total_steps": 504, "loss": 0.3816, "lr": 5.718467018163243e-07, "epoch": 2.4404761904761907, "percentage": 81.35, "elapsed_time": "6:42:18", "remaining_time": "1:32:14"}
|
44 |
+
{"current_steps": 420, "total_steps": 504, "loss": 0.3815, "lr": 4.6033961759594045e-07, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "6:51:56", "remaining_time": "1:22:23"}
|
45 |
+
{"current_steps": 430, "total_steps": 504, "loss": 0.3829, "lr": 3.598169012091049e-07, "epoch": 2.5595238095238093, "percentage": 85.32, "elapsed_time": "7:01:34", "remaining_time": "1:12:32"}
|
46 |
+
{"current_steps": 440, "total_steps": 504, "loss": 0.3837, "lr": 2.708199067468939e-07, "epoch": 2.619047619047619, "percentage": 87.3, "elapsed_time": "7:11:12", "remaining_time": "1:02:43"}
|
47 |
+
{"current_steps": 450, "total_steps": 504, "loss": 0.3818, "lr": 1.9382791778596864e-07, "epoch": 2.678571428571429, "percentage": 89.29, "elapsed_time": "7:20:50", "remaining_time": "0:52:54"}
|
48 |
+
{"current_steps": 460, "total_steps": 504, "loss": 0.3828, "lr": 1.2925556625931174e-07, "epoch": 2.738095238095238, "percentage": 91.27, "elapsed_time": "7:30:28", "remaining_time": "0:43:05"}
|
49 |
+
{"current_steps": 470, "total_steps": 504, "loss": 0.3819, "lr": 7.7450599501315e-08, "epoch": 2.7976190476190474, "percentage": 93.25, "elapsed_time": "7:40:06", "remaining_time": "0:33:17"}
|
50 |
+
{"current_steps": 480, "total_steps": 504, "loss": 0.3815, "lr": 3.869200749255703e-08, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "7:49:43", "remaining_time": "0:23:29"}
|
51 |
+
{"current_steps": 490, "total_steps": 504, "loss": 0.3791, "lr": 1.3188520389787462e-08, "epoch": 2.9166666666666665, "percentage": 97.22, "elapsed_time": "7:59:21", "remaining_time": "0:13:41"}
|
52 |
+
{"current_steps": 500, "total_steps": 504, "loss": 0.3811, "lr": 1.0774844325039946e-09, "epoch": 2.9761904761904763, "percentage": 99.21, "elapsed_time": "8:08:59", "remaining_time": "0:03:54"}
|