sedrickkeh commited on
Commit
a7a7ed0
·
verified ·
1 Parent(s): 2f082e0

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:111a6145ef043264c34e2185f2b00c9ef40511c367e9bd0d5ba5603746931267
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aabd14eb991de378cec947dec46e2c4fe49a8eb58afc7585ea8dd51f18f41bd0
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dab675c58f7b4fe212f59a98102d3035ad9c59ae7d637101d7b85f96bedffea
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cd2890f1463cfd889f74f1b6e6eabc12fdf867eecf85dad2ddca6ef780cb67c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b06ae13a8ad49b0e534315e21a0bba809ca9c315a13a1451d65aec81c3596374
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49f54d8dfefb6c6d67acc0e5db8184594389ef5b8b516809e23e02e812766500
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e38a4b60cef0c937ddd2ccd69e16fadad02d04663d7ee7ff56a614bd2ae3e99d
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bd7934a088dc7a4e163013a8d6ef48297394687f828e57a948e7ecd6c158982
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -10,3 +10,14 @@
10
  {"current_steps": 10, "total_steps": 30, "loss": 1.0839, "lr": 8.43120818934367e-06, "epoch": 0.96, "percentage": 33.33, "elapsed_time": "0:09:03", "remaining_time": "0:18:07"}
11
  {"current_steps": 11, "total_steps": 30, "loss": 1.6738, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:11:07", "remaining_time": "0:19:13"}
12
  {"current_steps": 12, "total_steps": 30, "loss": 1.0706, "lr": 7.500000000000001e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:12:00", "remaining_time": "0:18:00"}
 
 
 
 
 
 
 
 
 
 
 
 
10
  {"current_steps": 10, "total_steps": 30, "loss": 1.0839, "lr": 8.43120818934367e-06, "epoch": 0.96, "percentage": 33.33, "elapsed_time": "0:09:03", "remaining_time": "0:18:07"}
11
  {"current_steps": 11, "total_steps": 30, "loss": 1.6738, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:11:07", "remaining_time": "0:19:13"}
12
  {"current_steps": 12, "total_steps": 30, "loss": 1.0706, "lr": 7.500000000000001e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:12:00", "remaining_time": "0:18:00"}
13
+ {"current_steps": 13, "total_steps": 30, "loss": 1.0189, "lr": 6.980398830195785e-06, "epoch": 1.256, "percentage": 43.33, "elapsed_time": "0:12:51", "remaining_time": "0:16:48"}
14
+ {"current_steps": 14, "total_steps": 30, "loss": 1.028, "lr": 6.434016163555452e-06, "epoch": 1.3519999999999999, "percentage": 46.67, "elapsed_time": "0:13:36", "remaining_time": "0:15:33"}
15
+ {"current_steps": 15, "total_steps": 30, "loss": 0.9001, "lr": 5.8682408883346535e-06, "epoch": 1.448, "percentage": 50.0, "elapsed_time": "0:14:22", "remaining_time": "0:14:22"}
16
+ {"current_steps": 16, "total_steps": 30, "loss": 1.0615, "lr": 5.290724144552379e-06, "epoch": 1.544, "percentage": 53.33, "elapsed_time": "0:15:17", "remaining_time": "0:13:22"}
17
+ {"current_steps": 17, "total_steps": 30, "loss": 0.9473, "lr": 4.7092758554476215e-06, "epoch": 1.6400000000000001, "percentage": 56.67, "elapsed_time": "0:16:10", "remaining_time": "0:12:22"}
18
+ {"current_steps": 18, "total_steps": 30, "loss": 0.9851, "lr": 4.131759111665349e-06, "epoch": 1.736, "percentage": 60.0, "elapsed_time": "0:17:04", "remaining_time": "0:11:23"}
19
+ {"current_steps": 19, "total_steps": 30, "loss": 0.8426, "lr": 3.5659838364445505e-06, "epoch": 1.8319999999999999, "percentage": 63.33, "elapsed_time": "0:17:58", "remaining_time": "0:10:24"}
20
+ {"current_steps": 20, "total_steps": 30, "loss": 1.0051, "lr": 3.019601169804216e-06, "epoch": 1.928, "percentage": 66.67, "elapsed_time": "0:18:57", "remaining_time": "0:09:28"}
21
+ {"current_steps": 21, "total_steps": 30, "loss": 1.6283, "lr": 2.5000000000000015e-06, "epoch": 2.032, "percentage": 70.0, "elapsed_time": "0:21:00", "remaining_time": "0:09:00"}
22
+ {"current_steps": 22, "total_steps": 30, "loss": 0.9316, "lr": 2.0142070414860704e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:21:55", "remaining_time": "0:07:58"}
23
+ {"current_steps": 23, "total_steps": 30, "loss": 0.9276, "lr": 1.5687918106563326e-06, "epoch": 2.224, "percentage": 76.67, "elapsed_time": "0:22:49", "remaining_time": "0:06:56"}