ryanmarten commited on
Commit
ada7ed3
·
verified ·
1 Parent(s): 831dd31

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a569a45b5ed09afa9d5d2fe80e71a500ae9592d26c3a2c96eeb70b90e6a6bf4
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a79750c04042df180b1caeef918092bc4458cb1132d521c5d04b0037512585e3
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:601b1ce9c4a3e259446cbda76d8e549a6cc7ec48bf8753328890a555c7d30e25
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2abd84dfc36332bc902154326085e20edd5d5adb2cce7f1cbcb13afa274b94
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd9ca7cc75d0be88608dea4f97aab24b19ff5985a6fd64f312bf2b4cafed7b52
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9e08a45d404246181a9021eb71829e826c6f3320d1f0abbe1eb7f8e496884e3
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b70080ee8b24b6c8611def9cca4a14352ea4e6ac84cdf65e06b5073f12da4ea
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f91d14e578100b24ae0d58cd4e34ab0091de9b526d6d966d3ab267afc8291596
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -53,3 +53,13 @@
53
  {"current_steps": 53, "total_steps": 117, "loss": 0.1868, "lr": 6.686649936914151e-06, "epoch": 5.556962025316456, "percentage": 45.3, "elapsed_time": "0:26:52", "remaining_time": "0:32:26"}
54
  {"current_steps": 54, "total_steps": 117, "loss": 0.1927, "lr": 6.545084971874738e-06, "epoch": 5.658227848101266, "percentage": 46.15, "elapsed_time": "0:27:12", "remaining_time": "0:31:44"}
55
  {"current_steps": 55, "total_steps": 117, "loss": 0.3279, "lr": 6.402136946530014e-06, "epoch": 5.759493670886076, "percentage": 47.01, "elapsed_time": "0:27:47", "remaining_time": "0:31:19"}
 
 
 
 
 
 
 
 
 
 
 
53
  {"current_steps": 53, "total_steps": 117, "loss": 0.1868, "lr": 6.686649936914151e-06, "epoch": 5.556962025316456, "percentage": 45.3, "elapsed_time": "0:26:52", "remaining_time": "0:32:26"}
54
  {"current_steps": 54, "total_steps": 117, "loss": 0.1927, "lr": 6.545084971874738e-06, "epoch": 5.658227848101266, "percentage": 46.15, "elapsed_time": "0:27:12", "remaining_time": "0:31:44"}
55
  {"current_steps": 55, "total_steps": 117, "loss": 0.3279, "lr": 6.402136946530014e-06, "epoch": 5.759493670886076, "percentage": 47.01, "elapsed_time": "0:27:47", "remaining_time": "0:31:19"}
56
+ {"current_steps": 56, "total_steps": 117, "loss": 0.209, "lr": 6.257933818722544e-06, "epoch": 5.860759493670886, "percentage": 47.86, "elapsed_time": "0:28:08", "remaining_time": "0:30:38"}
57
+ {"current_steps": 57, "total_steps": 117, "loss": 0.2742, "lr": 6.112604669781572e-06, "epoch": 5.962025316455696, "percentage": 48.72, "elapsed_time": "0:28:35", "remaining_time": "0:30:05"}
58
+ {"current_steps": 58, "total_steps": 117, "loss": 0.2199, "lr": 5.9662795889777666e-06, "epoch": 6.10126582278481, "percentage": 49.57, "elapsed_time": "0:30:10", "remaining_time": "0:30:41"}
59
+ {"current_steps": 59, "total_steps": 117, "loss": 0.1918, "lr": 5.819089557075689e-06, "epoch": 6.2025316455696204, "percentage": 50.43, "elapsed_time": "0:30:27", "remaining_time": "0:29:56"}
60
+ {"current_steps": 60, "total_steps": 117, "loss": 0.197, "lr": 5.671166329088278e-06, "epoch": 6.30379746835443, "percentage": 51.28, "elapsed_time": "0:30:53", "remaining_time": "0:29:21"}
61
+ {"current_steps": 61, "total_steps": 117, "loss": 0.1614, "lr": 5.522642316338268e-06, "epoch": 6.405063291139241, "percentage": 52.14, "elapsed_time": "0:31:14", "remaining_time": "0:28:40"}
62
+ {"current_steps": 62, "total_steps": 117, "loss": 0.2126, "lr": 5.373650467932122e-06, "epoch": 6.506329113924051, "percentage": 52.99, "elapsed_time": "0:31:37", "remaining_time": "0:28:02"}
63
+ {"current_steps": 63, "total_steps": 117, "loss": 0.1935, "lr": 5.224324151752575e-06, "epoch": 6.6075949367088604, "percentage": 53.85, "elapsed_time": "0:32:01", "remaining_time": "0:27:26"}
64
+ {"current_steps": 64, "total_steps": 117, "loss": 0.1897, "lr": 5.074797035076319e-06, "epoch": 6.708860759493671, "percentage": 54.7, "elapsed_time": "0:32:19", "remaining_time": "0:26:46"}
65
+ {"current_steps": 65, "total_steps": 117, "loss": 0.2797, "lr": 4.9252029649236835e-06, "epoch": 6.810126582278481, "percentage": 55.56, "elapsed_time": "0:32:52", "remaining_time": "0:26:18"}