sedrickkeh commited on
Commit
cb2eb0d
·
verified ·
1 Parent(s): 6d84d6a

Training in progress, epoch 3

Browse files
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9417b453399d0235105a83665b67045dd503aa50eab1effd0644941cc3c804e7
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ff1a32cb551c4675893cfe7e45671b524ded51f041652b3367bb0464908e43a
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5c799f2568510d70dd519baed48d76eb4deedc38daa177e939bafe870201e76
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a646efd25dcd35ca63745c9cc912f25f4851b982fdf2e5bf5ab43a8133da47a
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a03fd8a37311abf1dad64132e13335dc935cd793d0947621f4aa774d7f3b42e
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af9a1db0b8edec62c3d5c01c415d95e125a776470c625fe00830c0ae6c54950
3
  size 4540516344
trainer_log.jsonl CHANGED
@@ -33,3 +33,20 @@
33
  {"current_steps": 320, "total_steps": 504, "loss": 0.4195, "lr": 1.9542666212969685e-06, "epoch": 1.9047619047619047, "percentage": 63.49, "elapsed_time": "2:56:52", "remaining_time": "1:41:41"}
34
  {"current_steps": 330, "total_steps": 504, "loss": 0.4198, "lr": 1.817762612003957e-06, "epoch": 1.9642857142857144, "percentage": 65.48, "elapsed_time": "3:02:17", "remaining_time": "1:36:07"}
35
  {"current_steps": 336, "total_steps": 504, "eval_loss": 0.05766107514500618, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:07:28", "remaining_time": "1:33:44"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  {"current_steps": 320, "total_steps": 504, "loss": 0.4195, "lr": 1.9542666212969685e-06, "epoch": 1.9047619047619047, "percentage": 63.49, "elapsed_time": "2:56:52", "remaining_time": "1:41:41"}
34
  {"current_steps": 330, "total_steps": 504, "loss": 0.4198, "lr": 1.817762612003957e-06, "epoch": 1.9642857142857144, "percentage": 65.48, "elapsed_time": "3:02:17", "remaining_time": "1:36:07"}
35
  {"current_steps": 336, "total_steps": 504, "eval_loss": 0.05766107514500618, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:07:28", "remaining_time": "1:33:44"}
36
+ {"current_steps": 340, "total_steps": 504, "loss": 0.4022, "lr": 1.6852840498821444e-06, "epoch": 2.0238095238095237, "percentage": 67.46, "elapsed_time": "3:10:29", "remaining_time": "1:31:53"}
37
+ {"current_steps": 350, "total_steps": 504, "loss": 0.3793, "lr": 1.5574029839182003e-06, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "3:15:56", "remaining_time": "1:26:12"}
38
+ {"current_steps": 360, "total_steps": 504, "loss": 0.3754, "lr": 1.4346716108828857e-06, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "3:21:21", "remaining_time": "1:20:32"}
39
+ {"current_steps": 370, "total_steps": 504, "loss": 0.3752, "lr": 1.317619890918075e-06, "epoch": 2.2023809523809526, "percentage": 73.41, "elapsed_time": "3:26:46", "remaining_time": "1:14:53"}
40
+ {"current_steps": 380, "total_steps": 504, "loss": 0.3781, "lr": 1.2067532591426361e-06, "epoch": 2.261904761904762, "percentage": 75.4, "elapsed_time": "3:32:14", "remaining_time": "1:09:15"}
41
+ {"current_steps": 390, "total_steps": 504, "loss": 0.3747, "lr": 1.1025504431585827e-06, "epoch": 2.3214285714285716, "percentage": 77.38, "elapsed_time": "3:37:41", "remaining_time": "1:03:37"}
42
+ {"current_steps": 400, "total_steps": 504, "loss": 0.3739, "lr": 1.0054613958815923e-06, "epoch": 2.380952380952381, "percentage": 79.37, "elapsed_time": "3:43:06", "remaining_time": "0:58:00"}
43
+ {"current_steps": 410, "total_steps": 504, "loss": 0.3739, "lr": 9.159053526220585e-07, "epoch": 2.4404761904761907, "percentage": 81.35, "elapsed_time": "3:48:32", "remaining_time": "0:52:23"}
44
+ {"current_steps": 420, "total_steps": 504, "loss": 0.3742, "lr": 8.342690208062692e-07, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "3:53:58", "remaining_time": "0:46:47"}
45
+ {"current_steps": 430, "total_steps": 504, "loss": 0.3756, "lr": 7.609049101546112e-07, "epoch": 2.5595238095238093, "percentage": 85.32, "elapsed_time": "3:59:26", "remaining_time": "0:41:12"}
46
+ {"current_steps": 440, "total_steps": 504, "loss": 0.3763, "lr": 6.961298105271477e-07, "epoch": 2.619047619047619, "percentage": 87.3, "elapsed_time": "4:04:51", "remaining_time": "0:35:36"}
47
+ {"current_steps": 450, "total_steps": 504, "loss": 0.3745, "lr": 6.40223424009332e-07, "epoch": 2.678571428571429, "percentage": 89.29, "elapsed_time": "4:10:17", "remaining_time": "0:30:02"}
48
+ {"current_steps": 460, "total_steps": 504, "loss": 0.3754, "lr": 5.9342715714456e-07, "epoch": 2.738095238095238, "percentage": 91.27, "elapsed_time": "4:15:44", "remaining_time": "0:24:27"}
49
+ {"current_steps": 470, "total_steps": 504, "loss": 0.3745, "lr": 5.559430785287691e-07, "epoch": 2.7976190476190474, "percentage": 93.25, "elapsed_time": "4:21:09", "remaining_time": "0:18:53"}
50
+ {"current_steps": 480, "total_steps": 504, "loss": 0.3739, "lr": 5.27933046268245e-07, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "4:26:35", "remaining_time": "0:13:19"}
51
+ {"current_steps": 490, "total_steps": 504, "loss": 0.3713, "lr": 5.095180090683062e-07, "epoch": 2.9166666666666665, "percentage": 97.22, "elapsed_time": "4:32:00", "remaining_time": "0:07:46"}
52
+ {"current_steps": 500, "total_steps": 504, "loss": 0.3732, "lr": 5.007774839708124e-07, "epoch": 2.9761904761904763, "percentage": 99.21, "elapsed_time": "4:37:25", "remaining_time": "0:02:13"}