EtashGuha commited on
Commit
b707712
·
verified ·
1 Parent(s): 8146de6

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1a672655c00e411f8a6b77168ea274acd442e2e57c27f37c46a283d390cd557
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c411998f5aa13b167b4169ea6693741dc84d7361c709b2bb63913c2c63899bc0
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09f98d46a633dc0111f3bf3fd42d048e9371331a5a1256f8e7bdac6edd1d253a
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2816be7f943abf8c7a9a381acb1547de648e60fa475348847826d79da4c60aa
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a69bd72ae63557f31959f2b43f72f3491c1992d00a95afa721893942ceff1638
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82d564947c65b123ef63cb7a39cb143934bf4c4ca0f50d209ba1b0033d8d9e02
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5952e3a690e18b99a1acf735d38fd2084142fdaced8db9b642baa7a94def9c85
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87eae362bfd33a24c49a6d745e6d16c1d922e9186fbd9b8f5381ed8432d87453
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -3,3 +3,7 @@
3
  {"current_steps": 30, "total_steps": 114, "loss": 1.0172, "lr": 5e-06, "epoch": 0.7704654895666132, "percentage": 26.32, "elapsed_time": "1:17:59", "remaining_time": "3:38:21"}
4
  {"current_steps": 38, "total_steps": 114, "eval_loss": 0.996041476726532, "epoch": 0.9759229534510433, "percentage": 33.33, "elapsed_time": "1:43:11", "remaining_time": "3:26:22"}
5
  {"current_steps": 40, "total_steps": 114, "loss": 0.9942, "lr": 5e-06, "epoch": 1.0272873194221508, "percentage": 35.09, "elapsed_time": "1:47:21", "remaining_time": "3:18:36"}
 
 
 
 
 
3
  {"current_steps": 30, "total_steps": 114, "loss": 1.0172, "lr": 5e-06, "epoch": 0.7704654895666132, "percentage": 26.32, "elapsed_time": "1:17:59", "remaining_time": "3:38:21"}
4
  {"current_steps": 38, "total_steps": 114, "eval_loss": 0.996041476726532, "epoch": 0.9759229534510433, "percentage": 33.33, "elapsed_time": "1:43:11", "remaining_time": "3:26:22"}
5
  {"current_steps": 40, "total_steps": 114, "loss": 0.9942, "lr": 5e-06, "epoch": 1.0272873194221508, "percentage": 35.09, "elapsed_time": "1:47:21", "remaining_time": "3:18:36"}
6
+ {"current_steps": 50, "total_steps": 114, "loss": 0.9489, "lr": 5e-06, "epoch": 1.2841091492776886, "percentage": 43.86, "elapsed_time": "2:13:17", "remaining_time": "2:50:37"}
7
+ {"current_steps": 60, "total_steps": 114, "loss": 0.9348, "lr": 5e-06, "epoch": 1.5409309791332264, "percentage": 52.63, "elapsed_time": "2:39:13", "remaining_time": "2:23:18"}
8
+ {"current_steps": 70, "total_steps": 114, "loss": 0.9304, "lr": 5e-06, "epoch": 1.797752808988764, "percentage": 61.4, "elapsed_time": "3:05:10", "remaining_time": "1:56:23"}
9
+ {"current_steps": 77, "total_steps": 114, "eval_loss": 0.9520364999771118, "epoch": 1.9775280898876404, "percentage": 67.54, "elapsed_time": "3:27:36", "remaining_time": "1:39:45"}