esfrankel17 committed on
Commit
1a6bef9
·
verified ·
1 Parent(s): 918f4cd

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80e898f686f91ca0491b32e277bfca0b81304d4522d569fe7481c19983dadd6d
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa7ddf40a53c01580113b725a0016eec9561e858e589517f9d83205265478d6b
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebde098b486f203fd01e807c2b6b0a84097d7212c0411c8a88f9e9fa8c651d74
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d362d83c2e9ba973e98cca23893617dd1bf3577389c0af075b784abd7f877f9d
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:723649201ed03575b92401a56585ed80868e56ccedd76a17987321cdadcc3692
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55b0d48a0edc756a4f62d053427ec9337fc67951899617d08adfc913344f0caa
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:482a33cd7718fe720f2f5641f13b3e589a85fbbe00478c2ec8bee820c7b59aff
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b229c76dc68a962cfcf861b4b833add51f486c85f418864f20b6ce72b2e7d061
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -1,2 +1,6 @@
1
  {"current_steps": 1, "total_steps": 3, "loss": 1.9079, "learning_rate": 5e-06, "epoch": 0.5333333333333333, "percentage": 33.33, "elapsed_time": "0:05:58", "remaining_time": "0:11:56"}
2
  {"current_steps": 1, "total_steps": 3, "eval_loss": 1.8345922231674194, "epoch": 0.5333333333333333, "percentage": 33.33, "elapsed_time": "0:11:21", "remaining_time": "0:22:42"}
 
 
 
 
 
1
  {"current_steps": 1, "total_steps": 3, "loss": 1.9079, "learning_rate": 5e-06, "epoch": 0.5333333333333333, "percentage": 33.33, "elapsed_time": "0:05:58", "remaining_time": "0:11:56"}
2
  {"current_steps": 1, "total_steps": 3, "eval_loss": 1.8345922231674194, "epoch": 0.5333333333333333, "percentage": 33.33, "elapsed_time": "0:11:21", "remaining_time": "0:22:42"}
3
+ {"current_steps": 2, "total_steps": 3, "loss": 1.8231, "learning_rate": 5e-06, "epoch": 1.0666666666666667, "percentage": 66.67, "elapsed_time": "0:13:18", "remaining_time": "0:06:39"}
4
+ {"current_steps": 3, "total_steps": 3, "loss": 1.7235, "learning_rate": 5e-06, "epoch": 1.6, "percentage": 100.0, "elapsed_time": "0:19:12", "remaining_time": "0:00:00"}
5
+ {"current_steps": 3, "total_steps": 3, "eval_loss": 1.7085474729537964, "epoch": 1.6, "percentage": 100.0, "elapsed_time": "0:20:38", "remaining_time": "0:00:00"}
6
+ {"current_steps": 3, "total_steps": 3, "epoch": 1.6, "percentage": 100.0, "elapsed_time": "0:21:23", "remaining_time": "0:00:00"}