sedrickkeh commited on
Commit
b64f213
·
verified ·
1 Parent(s): 6f6cfb0

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af6115a97d02a158fec5b5f71d4d66751ae1c61dae552e4eefa6d43d68698ed9
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f00143a457e487dc3a8136d9951e0fbdb0130909354b14a3f56fcda7144b4d4
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaafe5e96ff1b31bc808822c5dda6d1a06ac65659790416903614d5b096b0c87
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7a66d3abf53027e899a6076707d1c9ffbcaaa3ad7abc247d4a3cbdd40358d2a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:093f923db1014287794687550c81a9ee1ae6e1af64084d39e8bf08cad212ae8d
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20a11f1eb2fb64185869ae5b9ddcb9a41ce763e802108a6af2c7e8bc3fc65f23
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d59607569af98afff6e6598a2d37dc4535336af57565f8ff93d6d75b419e7be8
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11f0e0fcf1148a1192ff646fe2a7da68b642dc45e546a750b84521863bed3e6b
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -23,3 +23,9 @@
23
  {"current_steps": 23, "total_steps": 30, "loss": 0.8038, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:09:10", "remaining_time": "0:02:47"}
24
  {"current_steps": 24, "total_steps": 30, "loss": 0.7889, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:09:29", "remaining_time": "0:02:22"}
25
  {"current_steps": 25, "total_steps": 30, "loss": 0.8067, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:09:46", "remaining_time": "0:01:57"}
 
 
 
 
 
 
 
23
  {"current_steps": 23, "total_steps": 30, "loss": 0.8038, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:09:10", "remaining_time": "0:02:47"}
24
  {"current_steps": 24, "total_steps": 30, "loss": 0.7889, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:09:29", "remaining_time": "0:02:22"}
25
  {"current_steps": 25, "total_steps": 30, "loss": 0.8067, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:09:46", "remaining_time": "0:01:57"}
26
+ {"current_steps": 26, "total_steps": 30, "loss": 0.8279, "lr": 5.318367983829393e-07, "epoch": 2.4761904761904763, "percentage": 86.67, "elapsed_time": "0:10:06", "remaining_time": "0:01:33"}
27
+ {"current_steps": 27, "total_steps": 30, "loss": 0.7699, "lr": 3.015368960704584e-07, "epoch": 2.571428571428571, "percentage": 90.0, "elapsed_time": "0:10:20", "remaining_time": "0:01:08"}
28
+ {"current_steps": 28, "total_steps": 30, "loss": 0.7895, "lr": 1.3477564710088097e-07, "epoch": 2.6666666666666665, "percentage": 93.33, "elapsed_time": "0:10:42", "remaining_time": "0:00:45"}
29
+ {"current_steps": 29, "total_steps": 30, "loss": 0.8391, "lr": 3.3808211290284886e-08, "epoch": 2.761904761904762, "percentage": 96.67, "elapsed_time": "0:11:01", "remaining_time": "0:00:22"}
30
+ {"current_steps": 30, "total_steps": 30, "loss": 0.767, "lr": 0.0, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:11:20", "remaining_time": "0:00:00"}
31
+ {"current_steps": 30, "total_steps": 30, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:13:04", "remaining_time": "0:00:00"}