sedrickkeh commited on
Commit
6bcd906
·
verified ·
1 Parent(s): 909223e

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18c6cc5143950218296edee363116fe65483ff2ffeb047b334fa81b585fbc42b
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d54d3b4301b8f5636cc261314bc05f706d4356671582a13edadb08b9a704c544
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7403d16850012dca74da4a6be86a3862349191cfedd15a67def224e0a32fb9b
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72d8925558b37d4d6fc5b1481a614952a6b7a13dfc9a9a33fc21edcf0bee7d23
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a52d6a05c07827c0f52a53adee1d842e9556a27744575bfeff66a3f300459f8a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef57aed79f7e28685664bc13cdb588919866006c07d97a57f6d4aefca734807d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fbeb659986f9abe160ab0dc10b221884f8f8a809859aadb2f69488c66fe4301
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b97b4c07b00a0f449fdc5e7a70bb6d710a14fa6998c90bb56045f1a606a1602
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -23,3 +23,9 @@
23
  {"current_steps": 23, "total_steps": 30, "loss": 0.6867, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:17:14", "remaining_time": "0:05:14"}
24
  {"current_steps": 24, "total_steps": 30, "loss": 0.7336, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:17:47", "remaining_time": "0:04:26"}
25
  {"current_steps": 25, "total_steps": 30, "loss": 0.8412, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:18:36", "remaining_time": "0:03:43"}
 
 
 
 
 
 
 
23
  {"current_steps": 23, "total_steps": 30, "loss": 0.6867, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:17:14", "remaining_time": "0:05:14"}
24
  {"current_steps": 24, "total_steps": 30, "loss": 0.7336, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:17:47", "remaining_time": "0:04:26"}
25
  {"current_steps": 25, "total_steps": 30, "loss": 0.8412, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:18:36", "remaining_time": "0:03:43"}
26
+ {"current_steps": 26, "total_steps": 30, "loss": 0.7218, "lr": 5.318367983829393e-07, "epoch": 2.4761904761904763, "percentage": 86.67, "elapsed_time": "0:19:12", "remaining_time": "0:02:57"}
27
+ {"current_steps": 27, "total_steps": 30, "loss": 0.7787, "lr": 3.015368960704584e-07, "epoch": 2.571428571428571, "percentage": 90.0, "elapsed_time": "0:20:01", "remaining_time": "0:02:13"}
28
+ {"current_steps": 28, "total_steps": 30, "loss": 0.8023, "lr": 1.3477564710088097e-07, "epoch": 2.6666666666666665, "percentage": 93.33, "elapsed_time": "0:20:38", "remaining_time": "0:01:28"}
29
+ {"current_steps": 29, "total_steps": 30, "loss": 0.7005, "lr": 3.3808211290284886e-08, "epoch": 2.761904761904762, "percentage": 96.67, "elapsed_time": "0:21:12", "remaining_time": "0:00:43"}
30
+ {"current_steps": 30, "total_steps": 30, "loss": 0.7909, "lr": 0.0, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:22:03", "remaining_time": "0:00:00"}
31
+ {"current_steps": 30, "total_steps": 30, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:23:44", "remaining_time": "0:00:00"}