sedrickkeh committed on
Commit
d67ec46
·
verified ·
1 Parent(s): a0aaf69

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c7769dc968fbfe4c6430594fa2937fb10a1651a35b250ac35a0e928aafb925c
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac06ac3245c40add09c6b9ac5546cf12f2a11dab2b219df6b4883087c68e758
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c169681f94d906e79fc39e42397fda2436c48cfde94040beebaa956ffd5f4178
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1101b5f347b71f407e76292444c4a5f9f54d84e91fecc380b1ceb00fb392e3b5
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e641b74c9b89270891a37f86ae397ca2b2c2c68a8ab25deb2ace062a325cb22
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c29702af94b4100cb5cf273f3309918b982f8fa4c2e72b217526c1bb81b00e2
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:933b30d6692dc14502c7014498e882b80e48a5ce57cd090f4248173e341db53c
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66e0f3cbf07530c22d4b75cba1444c47d089cf759bd4c7edba5e7eb20f445ff6
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,7 @@
2
  {"current_steps": 20, "total_steps": 96, "loss": 0.6358, "lr": 5e-06, "epoch": 0.6106870229007634, "percentage": 20.83, "elapsed_time": "0:10:51", "remaining_time": "0:41:15"}
3
  {"current_steps": 30, "total_steps": 96, "loss": 0.5846, "lr": 5e-06, "epoch": 0.916030534351145, "percentage": 31.25, "elapsed_time": "0:16:12", "remaining_time": "0:35:40"}
4
  {"current_steps": 32, "total_steps": 96, "eval_loss": 0.5693601965904236, "epoch": 0.9770992366412213, "percentage": 33.33, "elapsed_time": "0:18:04", "remaining_time": "0:36:08"}
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 96, "loss": 0.6358, "lr": 5e-06, "epoch": 0.6106870229007634, "percentage": 20.83, "elapsed_time": "0:10:51", "remaining_time": "0:41:15"}
3
  {"current_steps": 30, "total_steps": 96, "loss": 0.5846, "lr": 5e-06, "epoch": 0.916030534351145, "percentage": 31.25, "elapsed_time": "0:16:12", "remaining_time": "0:35:40"}
4
  {"current_steps": 32, "total_steps": 96, "eval_loss": 0.5693601965904236, "epoch": 0.9770992366412213, "percentage": 33.33, "elapsed_time": "0:18:04", "remaining_time": "0:36:08"}
5
+ {"current_steps": 40, "total_steps": 96, "loss": 0.5516, "lr": 5e-06, "epoch": 1.2213740458015268, "percentage": 41.67, "elapsed_time": "0:23:10", "remaining_time": "0:32:26"}
6
+ {"current_steps": 50, "total_steps": 96, "loss": 0.5098, "lr": 5e-06, "epoch": 1.5267175572519083, "percentage": 52.08, "elapsed_time": "0:28:31", "remaining_time": "0:26:14"}
7
+ {"current_steps": 60, "total_steps": 96, "loss": 0.4986, "lr": 5e-06, "epoch": 1.83206106870229, "percentage": 62.5, "elapsed_time": "0:33:52", "remaining_time": "0:20:19"}
8
+ {"current_steps": 65, "total_steps": 96, "eval_loss": 0.5270054340362549, "epoch": 1.984732824427481, "percentage": 67.71, "elapsed_time": "0:37:06", "remaining_time": "0:17:41"}