sedrickkeh commited on
Commit
909223e
·
verified ·
1 Parent(s): f23abb2

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b767177671a88725a2c2af492fb3c09ae0388e18a6a9885e4f42d246e511c0c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18c6cc5143950218296edee363116fe65483ff2ffeb047b334fa81b585fbc42b
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81691fbe51ca46074db7cb9b8cbfe840fe01681740946f007f3b2f0712a49377
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7403d16850012dca74da4a6be86a3862349191cfedd15a67def224e0a32fb9b
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9582eec4559946641114f0403c57e9cbf81d4dce1ebbd43d42df8b5a04421037
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a52d6a05c07827c0f52a53adee1d842e9556a27744575bfeff66a3f300459f8a
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc95e64ef9c757c92f55986df57210fbd4d62e634fa1e78a29161a8ff116b954
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fbeb659986f9abe160ab0dc10b221884f8f8a809859aadb2f69488c66fe4301
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -13,3 +13,13 @@
13
  {"current_steps": 13, "total_steps": 30, "loss": 0.7946, "lr": 6.980398830195785e-06, "epoch": 1.2380952380952381, "percentage": 43.33, "elapsed_time": "0:09:33", "remaining_time": "0:12:29"}
14
  {"current_steps": 14, "total_steps": 30, "loss": 0.8539, "lr": 6.434016163555452e-06, "epoch": 1.3333333333333333, "percentage": 46.67, "elapsed_time": "0:10:04", "remaining_time": "0:11:30"}
15
  {"current_steps": 15, "total_steps": 30, "loss": 0.7039, "lr": 5.8682408883346535e-06, "epoch": 1.4285714285714286, "percentage": 50.0, "elapsed_time": "0:10:37", "remaining_time": "0:10:37"}
 
 
 
 
 
 
 
 
 
 
 
13
  {"current_steps": 13, "total_steps": 30, "loss": 0.7946, "lr": 6.980398830195785e-06, "epoch": 1.2380952380952381, "percentage": 43.33, "elapsed_time": "0:09:33", "remaining_time": "0:12:29"}
14
  {"current_steps": 14, "total_steps": 30, "loss": 0.8539, "lr": 6.434016163555452e-06, "epoch": 1.3333333333333333, "percentage": 46.67, "elapsed_time": "0:10:04", "remaining_time": "0:11:30"}
15
  {"current_steps": 15, "total_steps": 30, "loss": 0.7039, "lr": 5.8682408883346535e-06, "epoch": 1.4285714285714286, "percentage": 50.0, "elapsed_time": "0:10:37", "remaining_time": "0:10:37"}
16
+ {"current_steps": 16, "total_steps": 30, "loss": 0.8027, "lr": 5.290724144552379e-06, "epoch": 1.5238095238095237, "percentage": 53.33, "elapsed_time": "0:11:07", "remaining_time": "0:09:44"}
17
+ {"current_steps": 17, "total_steps": 30, "loss": 0.8275, "lr": 4.7092758554476215e-06, "epoch": 1.619047619047619, "percentage": 56.67, "elapsed_time": "0:12:00", "remaining_time": "0:09:10"}
18
+ {"current_steps": 18, "total_steps": 30, "loss": 0.9132, "lr": 4.131759111665349e-06, "epoch": 1.7142857142857144, "percentage": 60.0, "elapsed_time": "0:12:49", "remaining_time": "0:08:32"}
19
+ {"current_steps": 19, "total_steps": 30, "loss": 0.7173, "lr": 3.5659838364445505e-06, "epoch": 1.8095238095238095, "percentage": 63.33, "elapsed_time": "0:13:41", "remaining_time": "0:07:55"}
20
+ {"current_steps": 20, "total_steps": 30, "loss": 0.856, "lr": 3.019601169804216e-06, "epoch": 1.9047619047619047, "percentage": 66.67, "elapsed_time": "0:14:26", "remaining_time": "0:07:13"}
21
+ {"current_steps": 21, "total_steps": 30, "loss": 1.0468, "lr": 2.5000000000000015e-06, "epoch": 2.0, "percentage": 70.0, "elapsed_time": "0:15:07", "remaining_time": "0:06:29"}
22
+ {"current_steps": 22, "total_steps": 30, "loss": 0.7511, "lr": 2.0142070414860704e-06, "epoch": 2.0952380952380953, "percentage": 73.33, "elapsed_time": "0:16:45", "remaining_time": "0:06:05"}
23
+ {"current_steps": 23, "total_steps": 30, "loss": 0.6867, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:17:14", "remaining_time": "0:05:14"}
24
+ {"current_steps": 24, "total_steps": 30, "loss": 0.7336, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:17:47", "remaining_time": "0:04:26"}
25
+ {"current_steps": 25, "total_steps": 30, "loss": 0.8412, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:18:36", "remaining_time": "0:03:43"}