gsmyrnis commited on
Commit
6d366c1
·
verified ·
1 Parent(s): bb79b78

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16cc5d1bb125c57ea6fc869aab20aadadfc0fbd3a605d8fb5dca06b7e9e0f664
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d04304e3e4d5c1e17e2611a7b980a66b797f2b3c91777dc987c20b4ebf6af7a
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fc6280e247bfa5498fcd135deaba4f49564dd7bbc7d72b0e2bb7cc72e76b8e7
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8daf5f19f565b2f5bf25812b4323eeb3a518a4fbbc3883a5bc28bf2580ff6a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4bcded7b7a7fe7b92f574fac2147157021d11e42ba89a3b59d597b23927ce51
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:968d19c8108eb796f9aa5017183fd3f81c5304053e3b6629aea04b93b1b4de92
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2424a1ca29871a3d27cc4dcd40acf224b038934d6344ac3c4c786c97400fb765
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:810a85fbfd8fabf299d7974bf3aed9b5e87092a500f6d18517324f0be51ad722
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -281,3 +281,33 @@
281
  {"current_steps": 281, "total_steps": 312, "loss": 0.4308, "lr": 2.9940862715390483e-07, "epoch": 2.693290734824281, "percentage": 90.06, "elapsed_time": "1:17:43", "remaining_time": "0:08:34"}
282
  {"current_steps": 282, "total_steps": 312, "loss": 0.4411, "lr": 2.8058334845816214e-07, "epoch": 2.702875399361022, "percentage": 90.38, "elapsed_time": "1:17:57", "remaining_time": "0:08:17"}
283
  {"current_steps": 283, "total_steps": 312, "loss": 0.4232, "lr": 2.6235218056235633e-07, "epoch": 2.7124600638977636, "percentage": 90.71, "elapsed_time": "1:18:14", "remaining_time": "0:08:01"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
281
  {"current_steps": 281, "total_steps": 312, "loss": 0.4308, "lr": 2.9940862715390483e-07, "epoch": 2.693290734824281, "percentage": 90.06, "elapsed_time": "1:17:43", "remaining_time": "0:08:34"}
282
  {"current_steps": 282, "total_steps": 312, "loss": 0.4411, "lr": 2.8058334845816214e-07, "epoch": 2.702875399361022, "percentage": 90.38, "elapsed_time": "1:17:57", "remaining_time": "0:08:17"}
283
  {"current_steps": 283, "total_steps": 312, "loss": 0.4232, "lr": 2.6235218056235633e-07, "epoch": 2.7124600638977636, "percentage": 90.71, "elapsed_time": "1:18:14", "remaining_time": "0:08:01"}
284
+ {"current_steps": 284, "total_steps": 312, "loss": 0.46, "lr": 2.447174185242324e-07, "epoch": 2.722044728434505, "percentage": 91.03, "elapsed_time": "1:18:32", "remaining_time": "0:07:44"}
285
+ {"current_steps": 285, "total_steps": 312, "loss": 0.3887, "lr": 2.276812823220964e-07, "epoch": 2.731629392971246, "percentage": 91.35, "elapsed_time": "1:18:50", "remaining_time": "0:07:28"}
286
+ {"current_steps": 286, "total_steps": 312, "loss": 0.4616, "lr": 2.1124591657534776e-07, "epoch": 2.741214057507987, "percentage": 91.67, "elapsed_time": "1:19:05", "remaining_time": "0:07:11"}
287
+ {"current_steps": 287, "total_steps": 312, "loss": 0.4318, "lr": 1.9541339027450256e-07, "epoch": 2.7507987220447285, "percentage": 91.99, "elapsed_time": "1:19:21", "remaining_time": "0:06:54"}
288
+ {"current_steps": 288, "total_steps": 312, "loss": 0.396, "lr": 1.801856965207338e-07, "epoch": 2.7603833865814695, "percentage": 92.31, "elapsed_time": "1:19:38", "remaining_time": "0:06:38"}
289
+ {"current_steps": 289, "total_steps": 312, "loss": 0.419, "lr": 1.6556475227496816e-07, "epoch": 2.769968051118211, "percentage": 92.63, "elapsed_time": "1:19:55", "remaining_time": "0:06:21"}
290
+ {"current_steps": 290, "total_steps": 312, "loss": 0.4476, "lr": 1.5155239811656562e-07, "epoch": 2.779552715654952, "percentage": 92.95, "elapsed_time": "1:20:10", "remaining_time": "0:06:04"}
291
+ {"current_steps": 291, "total_steps": 312, "loss": 0.404, "lr": 1.3815039801161723e-07, "epoch": 2.7891373801916934, "percentage": 93.27, "elapsed_time": "1:20:27", "remaining_time": "0:05:48"}
292
+ {"current_steps": 292, "total_steps": 312, "loss": 0.3836, "lr": 1.253604390908819e-07, "epoch": 2.7987220447284344, "percentage": 93.59, "elapsed_time": "1:20:43", "remaining_time": "0:05:31"}
293
+ {"current_steps": 293, "total_steps": 312, "loss": 0.4827, "lr": 1.1318413143740436e-07, "epoch": 2.8083067092651754, "percentage": 93.91, "elapsed_time": "1:21:00", "remaining_time": "0:05:15"}
294
+ {"current_steps": 294, "total_steps": 312, "loss": 0.4143, "lr": 1.0162300788382263e-07, "epoch": 2.817891373801917, "percentage": 94.23, "elapsed_time": "1:21:16", "remaining_time": "0:04:58"}
295
+ {"current_steps": 295, "total_steps": 312, "loss": 0.3934, "lr": 9.0678523819408e-08, "epoch": 2.8274760383386583, "percentage": 94.55, "elapsed_time": "1:21:33", "remaining_time": "0:04:41"}
296
+ {"current_steps": 296, "total_steps": 312, "loss": 0.4563, "lr": 8.035205700685167e-08, "epoch": 2.8370607028753994, "percentage": 94.87, "elapsed_time": "1:21:49", "remaining_time": "0:04:25"}
297
+ {"current_steps": 297, "total_steps": 312, "loss": 0.4202, "lr": 7.064490740882057e-08, "epoch": 2.8466453674121404, "percentage": 95.19, "elapsed_time": "1:22:07", "remaining_time": "0:04:08"}
298
+ {"current_steps": 298, "total_steps": 312, "loss": 0.4287, "lr": 6.15582970243117e-08, "epoch": 2.856230031948882, "percentage": 95.51, "elapsed_time": "1:22:24", "remaining_time": "0:03:52"}
299
+ {"current_steps": 299, "total_steps": 312, "loss": 0.4808, "lr": 5.3093369734816824e-08, "epoch": 2.8658146964856233, "percentage": 95.83, "elapsed_time": "1:22:43", "remaining_time": "0:03:35"}
300
+ {"current_steps": 300, "total_steps": 312, "loss": 0.4645, "lr": 4.52511911603265e-08, "epoch": 2.8753993610223643, "percentage": 96.15, "elapsed_time": "1:22:58", "remaining_time": "0:03:19"}
301
+ {"current_steps": 301, "total_steps": 312, "loss": 0.3763, "lr": 3.8032748525179684e-08, "epoch": 2.8849840255591053, "percentage": 96.47, "elapsed_time": "1:23:13", "remaining_time": "0:03:02"}
302
+ {"current_steps": 302, "total_steps": 312, "loss": 0.4531, "lr": 3.143895053378698e-08, "epoch": 2.8945686900958467, "percentage": 96.79, "elapsed_time": "1:23:30", "remaining_time": "0:02:45"}
303
+ {"current_steps": 303, "total_steps": 312, "loss": 0.3988, "lr": 2.547062725623828e-08, "epoch": 2.9041533546325877, "percentage": 97.12, "elapsed_time": "1:23:47", "remaining_time": "0:02:29"}
304
+ {"current_steps": 304, "total_steps": 312, "loss": 0.4257, "lr": 2.012853002380466e-08, "epoch": 2.913738019169329, "percentage": 97.44, "elapsed_time": "1:24:03", "remaining_time": "0:02:12"}
305
+ {"current_steps": 305, "total_steps": 312, "loss": 0.4586, "lr": 1.541333133436018e-08, "epoch": 2.92332268370607, "percentage": 97.76, "elapsed_time": "1:24:18", "remaining_time": "0:01:56"}
306
+ {"current_steps": 306, "total_steps": 312, "loss": 0.4507, "lr": 1.132562476771959e-08, "epoch": 2.9329073482428116, "percentage": 98.08, "elapsed_time": "1:24:34", "remaining_time": "0:01:39"}
307
+ {"current_steps": 307, "total_steps": 312, "loss": 0.4184, "lr": 7.865924910916977e-09, "epoch": 2.9424920127795526, "percentage": 98.4, "elapsed_time": "1:24:48", "remaining_time": "0:01:22"}
308
+ {"current_steps": 308, "total_steps": 312, "loss": 0.3953, "lr": 5.034667293427053e-09, "epoch": 2.952076677316294, "percentage": 98.72, "elapsed_time": "1:25:06", "remaining_time": "0:01:06"}
309
+ {"current_steps": 309, "total_steps": 312, "loss": 0.4028, "lr": 2.8322083323334417e-09, "epoch": 2.961661341853035, "percentage": 99.04, "elapsed_time": "1:25:22", "remaining_time": "0:00:49"}
310
+ {"current_steps": 310, "total_steps": 312, "loss": 0.4173, "lr": 1.2588252874673469e-09, "epoch": 2.9712460063897765, "percentage": 99.36, "elapsed_time": "1:25:38", "remaining_time": "0:00:33"}
311
+ {"current_steps": 311, "total_steps": 312, "loss": 0.3893, "lr": 3.147162264971471e-10, "epoch": 2.9808306709265175, "percentage": 99.68, "elapsed_time": "1:25:55", "remaining_time": "0:00:16"}
312
+ {"current_steps": 312, "total_steps": 312, "loss": 0.4429, "lr": 0.0, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "1:26:12", "remaining_time": "0:00:00"}
313
+ {"current_steps": 312, "total_steps": 312, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "1:29:00", "remaining_time": "0:00:00"}