sedrickkeh commited on
Commit
a3ea2a1
·
verified ·
1 Parent(s): 35e3339

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ccc6562e39b1aef1f3c8393b76942e5217e02b25371469a934cfb2576505707
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1d3b6f1d26d70b32bd690ea723f7285630fc85fd9de61ff2e08e860b0b6bad1
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99a792725e77604dc6393b772a2ee4bde9f08701908c4dd58f8b08f6607eedbf
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80ffce1f241a0b536689d65dbcc7108256c00e973ec986af2321c53369120623
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cfab223a4ddc4c74dadfaa08d160f23640a7a13ef06dd4ab5a1a907e45c0676
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71aeaa957f88479af7c27b53efd60e2df95a117803180d6b77e51ace5f1fda91
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f66779a616603967f41d59f299b84b1ed4855b75ec52408439d54d1dd7ed656e
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e107e1af5d4f759da5e1e45249a96f8bff5f48a9f386e4d6619d5397beacdae5
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -1,3 +1,7 @@
1
  {"current_steps": 10, "total_steps": 69, "loss": 1.0642, "lr": 5e-06, "epoch": 0.42328042328042326, "percentage": 14.49, "elapsed_time": "0:05:23", "remaining_time": "0:31:48"}
2
  {"current_steps": 20, "total_steps": 69, "loss": 0.9362, "lr": 5e-06, "epoch": 0.8465608465608465, "percentage": 28.99, "elapsed_time": "0:10:38", "remaining_time": "0:26:03"}
3
  {"current_steps": 23, "total_steps": 69, "eval_loss": 0.9042366743087769, "epoch": 0.9735449735449735, "percentage": 33.33, "elapsed_time": "0:12:42", "remaining_time": "0:25:24"}
 
 
 
 
 
1
  {"current_steps": 10, "total_steps": 69, "loss": 1.0642, "lr": 5e-06, "epoch": 0.42328042328042326, "percentage": 14.49, "elapsed_time": "0:05:23", "remaining_time": "0:31:48"}
2
  {"current_steps": 20, "total_steps": 69, "loss": 0.9362, "lr": 5e-06, "epoch": 0.8465608465608465, "percentage": 28.99, "elapsed_time": "0:10:38", "remaining_time": "0:26:03"}
3
  {"current_steps": 23, "total_steps": 69, "eval_loss": 0.9042366743087769, "epoch": 0.9735449735449735, "percentage": 33.33, "elapsed_time": "0:12:42", "remaining_time": "0:25:24"}
4
+ {"current_steps": 30, "total_steps": 69, "loss": 0.9376, "lr": 5e-06, "epoch": 1.2804232804232805, "percentage": 43.48, "elapsed_time": "0:17:25", "remaining_time": "0:22:39"}
5
+ {"current_steps": 40, "total_steps": 69, "loss": 0.8478, "lr": 5e-06, "epoch": 1.7037037037037037, "percentage": 57.97, "elapsed_time": "0:22:41", "remaining_time": "0:16:26"}
6
+ {"current_steps": 46, "total_steps": 69, "eval_loss": 0.8493698835372925, "epoch": 1.9576719576719577, "percentage": 66.67, "elapsed_time": "0:26:26", "remaining_time": "0:13:13"}
7
+ {"current_steps": 50, "total_steps": 69, "loss": 0.8658, "lr": 5e-06, "epoch": 2.1375661375661377, "percentage": 72.46, "elapsed_time": "0:29:30", "remaining_time": "0:11:12"}