penfever commited on
Commit
465949d
·
verified ·
1 Parent(s): 35d1e21

Training in progress, step 9000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0bea2294954e12f121f7e94d85fda7c7245728ed5984316f4a55409084ca9e74
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb4f58a97325a61064ff38d47ca017e5d6b8c7707e8f7ee5e931ad790f5eb7aa
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:497ecf0d286f382b71e3c3094ba2b0aaddb606ebe3997d1ecbec8d6e79399e42
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c294157d1a1b3ac37e17eefa37d8ad243df87b74e4b473f8c8d78f2781fbe314
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a3a924de21f7e5f5ddf8de1a2d51e3e0de5d6a737f0d622b85cfda689ba679c
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e3683e0a62e25128ac9e62fa528d912a726ddfcb0adbe69d697eb3d9d201b0
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c54be22b3807c8db115c8f46225d471a06fed0d353a0cf3fbdfd5a81ecab371
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:093d0fa42b610cb32cd7733363aa22b1e46fa617245fb894e2b35237f5d412cd
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1547,3 +1547,272 @@
1547
  {"current_steps": 7735, "total_steps": 12698, "loss": 0.1309, "lr": 1.590560613497172e-05, "epoch": 4.2640573318632855, "percentage": 60.92, "elapsed_time": "14:10:20", "remaining_time": "9:05:36"}
1548
  {"current_steps": 7740, "total_steps": 12698, "loss": 0.1322, "lr": 1.587870192811439e-05, "epoch": 4.266813671444322, "percentage": 60.95, "elapsed_time": "14:10:33", "remaining_time": "9:04:50"}
1549
  {"current_steps": 7745, "total_steps": 12698, "loss": 0.1396, "lr": 1.5851805507594987e-05, "epoch": 4.269570011025358, "percentage": 60.99, "elapsed_time": "14:10:48", "remaining_time": "9:04:05"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1547
  {"current_steps": 7735, "total_steps": 12698, "loss": 0.1309, "lr": 1.590560613497172e-05, "epoch": 4.2640573318632855, "percentage": 60.92, "elapsed_time": "14:10:20", "remaining_time": "9:05:36"}
1548
  {"current_steps": 7740, "total_steps": 12698, "loss": 0.1322, "lr": 1.587870192811439e-05, "epoch": 4.266813671444322, "percentage": 60.95, "elapsed_time": "14:10:33", "remaining_time": "9:04:50"}
1549
  {"current_steps": 7745, "total_steps": 12698, "loss": 0.1396, "lr": 1.5851805507594987e-05, "epoch": 4.269570011025358, "percentage": 60.99, "elapsed_time": "14:10:48", "remaining_time": "9:04:05"}
1550
+ {"current_steps": 7750, "total_steps": 12698, "loss": 0.1444, "lr": 1.582491692422872e-05, "epoch": 4.272326350606395, "percentage": 61.03, "elapsed_time": "14:11:01", "remaining_time": "9:03:20"}
1551
+ {"current_steps": 7755, "total_steps": 12698, "loss": 0.1334, "lr": 1.5798036228815988e-05, "epoch": 4.275082690187431, "percentage": 61.07, "elapsed_time": "14:11:13", "remaining_time": "9:02:34"}
1552
+ {"current_steps": 7760, "total_steps": 12698, "loss": 0.1257, "lr": 1.57711634721423e-05, "epoch": 4.277839029768468, "percentage": 61.11, "elapsed_time": "14:11:26", "remaining_time": "9:01:48"}
1553
+ {"current_steps": 7765, "total_steps": 12698, "loss": 0.14, "lr": 1.5744298704978135e-05, "epoch": 4.280595369349504, "percentage": 61.15, "elapsed_time": "14:11:39", "remaining_time": "9:01:02"}
1554
+ {"current_steps": 7770, "total_steps": 12698, "loss": 0.1275, "lr": 1.5717441978078914e-05, "epoch": 4.283351708930541, "percentage": 61.19, "elapsed_time": "14:11:51", "remaining_time": "9:00:16"}
1555
+ {"current_steps": 7775, "total_steps": 12698, "loss": 0.1274, "lr": 1.5690593342184854e-05, "epoch": 4.286108048511577, "percentage": 61.23, "elapsed_time": "14:12:03", "remaining_time": "8:59:30"}
1556
+ {"current_steps": 7780, "total_steps": 12698, "loss": 0.1255, "lr": 1.5663752848020875e-05, "epoch": 4.288864388092613, "percentage": 61.27, "elapsed_time": "14:12:15", "remaining_time": "8:58:44"}
1557
+ {"current_steps": 7785, "total_steps": 12698, "loss": 0.134, "lr": 1.5636920546296533e-05, "epoch": 4.291620727673649, "percentage": 61.31, "elapsed_time": "14:12:28", "remaining_time": "8:57:59"}
1558
+ {"current_steps": 7790, "total_steps": 12698, "loss": 0.1375, "lr": 1.561009648770589e-05, "epoch": 4.294377067254686, "percentage": 61.35, "elapsed_time": "14:12:40", "remaining_time": "8:57:13"}
1559
+ {"current_steps": 7795, "total_steps": 12698, "loss": 0.1287, "lr": 1.5583280722927437e-05, "epoch": 4.297133406835722, "percentage": 61.39, "elapsed_time": "14:12:53", "remaining_time": "8:56:27"}
1560
+ {"current_steps": 7800, "total_steps": 12698, "loss": 0.1309, "lr": 1.5556473302624017e-05, "epoch": 4.299889746416759, "percentage": 61.43, "elapsed_time": "14:13:06", "remaining_time": "8:55:42"}
1561
+ {"current_steps": 7805, "total_steps": 12698, "loss": 0.1335, "lr": 1.5529674277442674e-05, "epoch": 4.302646085997795, "percentage": 61.47, "elapsed_time": "14:13:19", "remaining_time": "8:54:57"}
1562
+ {"current_steps": 7810, "total_steps": 12698, "loss": 0.1356, "lr": 1.5502883698014614e-05, "epoch": 4.305402425578832, "percentage": 61.51, "elapsed_time": "14:13:31", "remaining_time": "8:54:11"}
1563
+ {"current_steps": 7815, "total_steps": 12698, "loss": 0.1319, "lr": 1.547610161495508e-05, "epoch": 4.308158765159868, "percentage": 61.55, "elapsed_time": "14:13:44", "remaining_time": "8:53:26"}
1564
+ {"current_steps": 7820, "total_steps": 12698, "loss": 0.1305, "lr": 1.5449328078863265e-05, "epoch": 4.3109151047409044, "percentage": 61.58, "elapsed_time": "14:13:56", "remaining_time": "8:52:40"}
1565
+ {"current_steps": 7825, "total_steps": 12698, "loss": 0.1249, "lr": 1.5422563140322208e-05, "epoch": 4.31367144432194, "percentage": 61.62, "elapsed_time": "14:14:08", "remaining_time": "8:51:54"}
1566
+ {"current_steps": 7830, "total_steps": 12698, "loss": 0.1408, "lr": 1.5395806849898713e-05, "epoch": 4.316427783902977, "percentage": 61.66, "elapsed_time": "14:14:22", "remaining_time": "8:51:10"}
1567
+ {"current_steps": 7835, "total_steps": 12698, "loss": 0.1368, "lr": 1.536905925814324e-05, "epoch": 4.319184123484013, "percentage": 61.7, "elapsed_time": "14:14:35", "remaining_time": "8:50:25"}
1568
+ {"current_steps": 7840, "total_steps": 12698, "loss": 0.126, "lr": 1.5342320415589816e-05, "epoch": 4.32194046306505, "percentage": 61.74, "elapsed_time": "14:14:47", "remaining_time": "8:49:39"}
1569
+ {"current_steps": 7845, "total_steps": 12698, "loss": 0.1312, "lr": 1.531559037275594e-05, "epoch": 4.324696802646086, "percentage": 61.78, "elapsed_time": "14:14:58", "remaining_time": "8:48:54"}
1570
+ {"current_steps": 7850, "total_steps": 12698, "loss": 0.1403, "lr": 1.5288869180142482e-05, "epoch": 4.327453142227123, "percentage": 61.82, "elapsed_time": "14:15:11", "remaining_time": "8:48:09"}
1571
+ {"current_steps": 7855, "total_steps": 12698, "loss": 0.1319, "lr": 1.5262156888233596e-05, "epoch": 4.330209481808159, "percentage": 61.86, "elapsed_time": "14:15:24", "remaining_time": "8:47:24"}
1572
+ {"current_steps": 7860, "total_steps": 12698, "loss": 0.1337, "lr": 1.523545354749661e-05, "epoch": 4.3329658213891955, "percentage": 61.9, "elapsed_time": "14:15:36", "remaining_time": "8:46:38"}
1573
+ {"current_steps": 7865, "total_steps": 12698, "loss": 0.1357, "lr": 1.5208759208381952e-05, "epoch": 4.335722160970231, "percentage": 61.94, "elapsed_time": "14:15:48", "remaining_time": "8:45:53"}
1574
+ {"current_steps": 7870, "total_steps": 12698, "loss": 0.1309, "lr": 1.5182073921323044e-05, "epoch": 4.338478500551268, "percentage": 61.98, "elapsed_time": "14:16:00", "remaining_time": "8:45:07"}
1575
+ {"current_steps": 7875, "total_steps": 12698, "loss": 0.1373, "lr": 1.5155397736736197e-05, "epoch": 4.341234840132304, "percentage": 62.02, "elapsed_time": "14:16:13", "remaining_time": "8:44:23"}
1576
+ {"current_steps": 7880, "total_steps": 12698, "loss": 0.1428, "lr": 1.5128730705020528e-05, "epoch": 4.343991179713341, "percentage": 62.06, "elapsed_time": "14:16:26", "remaining_time": "8:43:39"}
1577
+ {"current_steps": 7885, "total_steps": 12698, "loss": 0.1386, "lr": 1.5102072876557867e-05, "epoch": 4.346747519294377, "percentage": 62.1, "elapsed_time": "14:16:42", "remaining_time": "8:42:55"}
1578
+ {"current_steps": 7890, "total_steps": 12698, "loss": 0.1404, "lr": 1.5075424301712645e-05, "epoch": 4.349503858875414, "percentage": 62.14, "elapsed_time": "14:16:54", "remaining_time": "8:42:11"}
1579
+ {"current_steps": 7895, "total_steps": 12698, "loss": 0.1264, "lr": 1.5048785030831821e-05, "epoch": 4.35226019845645, "percentage": 62.18, "elapsed_time": "14:17:05", "remaining_time": "8:41:25"}
1580
+ {"current_steps": 7900, "total_steps": 12698, "loss": 0.132, "lr": 1.5022155114244773e-05, "epoch": 4.355016538037487, "percentage": 62.21, "elapsed_time": "14:17:18", "remaining_time": "8:40:40"}
1581
+ {"current_steps": 7905, "total_steps": 12698, "loss": 0.1354, "lr": 1.499553460226321e-05, "epoch": 4.3577728776185225, "percentage": 62.25, "elapsed_time": "14:17:30", "remaining_time": "8:39:55"}
1582
+ {"current_steps": 7910, "total_steps": 12698, "loss": 0.1329, "lr": 1.4968923545181055e-05, "epoch": 4.360529217199559, "percentage": 62.29, "elapsed_time": "14:17:43", "remaining_time": "8:39:11"}
1583
+ {"current_steps": 7915, "total_steps": 12698, "loss": 0.1245, "lr": 1.4942321993274387e-05, "epoch": 4.363285556780595, "percentage": 62.33, "elapsed_time": "14:17:55", "remaining_time": "8:38:26"}
1584
+ {"current_steps": 7920, "total_steps": 12698, "loss": 0.1423, "lr": 1.4915729996801326e-05, "epoch": 4.366041896361632, "percentage": 62.37, "elapsed_time": "14:18:07", "remaining_time": "8:37:41"}
1585
+ {"current_steps": 7925, "total_steps": 12698, "loss": 0.1402, "lr": 1.4889147606001932e-05, "epoch": 4.368798235942668, "percentage": 62.41, "elapsed_time": "14:18:20", "remaining_time": "8:36:57"}
1586
+ {"current_steps": 7930, "total_steps": 12698, "loss": 0.1348, "lr": 1.4862574871098118e-05, "epoch": 4.371554575523705, "percentage": 62.45, "elapsed_time": "14:18:33", "remaining_time": "8:36:12"}
1587
+ {"current_steps": 7935, "total_steps": 12698, "loss": 0.1317, "lr": 1.4836011842293554e-05, "epoch": 4.374310915104741, "percentage": 62.49, "elapsed_time": "14:18:48", "remaining_time": "8:35:29"}
1588
+ {"current_steps": 7940, "total_steps": 12698, "loss": 0.1166, "lr": 1.4809458569773569e-05, "epoch": 4.377067254685778, "percentage": 62.53, "elapsed_time": "14:19:03", "remaining_time": "8:34:47"}
1589
+ {"current_steps": 7945, "total_steps": 12698, "loss": 0.1276, "lr": 1.4782915103705076e-05, "epoch": 4.379823594266814, "percentage": 62.57, "elapsed_time": "14:19:15", "remaining_time": "8:34:02"}
1590
+ {"current_steps": 7950, "total_steps": 12698, "loss": 0.1289, "lr": 1.4756381494236443e-05, "epoch": 4.38257993384785, "percentage": 62.61, "elapsed_time": "14:19:27", "remaining_time": "8:33:17"}
1591
+ {"current_steps": 7955, "total_steps": 12698, "loss": 0.1325, "lr": 1.4729857791497417e-05, "epoch": 4.385336273428886, "percentage": 62.65, "elapsed_time": "14:19:41", "remaining_time": "8:32:34"}
1592
+ {"current_steps": 7960, "total_steps": 12698, "loss": 0.1311, "lr": 1.4703344045599037e-05, "epoch": 4.388092613009923, "percentage": 62.69, "elapsed_time": "14:19:53", "remaining_time": "8:31:49"}
1593
+ {"current_steps": 7965, "total_steps": 12698, "loss": 0.1371, "lr": 1.467684030663353e-05, "epoch": 4.390848952590959, "percentage": 62.73, "elapsed_time": "14:20:06", "remaining_time": "8:31:05"}
1594
+ {"current_steps": 7970, "total_steps": 12698, "loss": 0.1314, "lr": 1.4650346624674212e-05, "epoch": 4.393605292171996, "percentage": 62.77, "elapsed_time": "14:20:18", "remaining_time": "8:30:21"}
1595
+ {"current_steps": 7975, "total_steps": 12698, "loss": 0.1725, "lr": 1.46238630497754e-05, "epoch": 4.396361631753032, "percentage": 62.81, "elapsed_time": "14:20:38", "remaining_time": "8:29:41"}
1596
+ {"current_steps": 7980, "total_steps": 12698, "loss": 0.2388, "lr": 1.4597389631972314e-05, "epoch": 4.399117971334069, "percentage": 62.84, "elapsed_time": "14:21:29", "remaining_time": "8:29:20"}
1597
+ {"current_steps": 7985, "total_steps": 12698, "loss": 0.2295, "lr": 1.4570926421280982e-05, "epoch": 4.401874310915105, "percentage": 62.88, "elapsed_time": "14:22:17", "remaining_time": "8:28:57"}
1598
+ {"current_steps": 7990, "total_steps": 12698, "loss": 0.2223, "lr": 1.4544473467698165e-05, "epoch": 4.404630650496141, "percentage": 62.92, "elapsed_time": "14:23:13", "remaining_time": "8:28:38"}
1599
+ {"current_steps": 7995, "total_steps": 12698, "loss": 0.2136, "lr": 1.4518030821201223e-05, "epoch": 4.407386990077177, "percentage": 62.96, "elapsed_time": "14:24:05", "remaining_time": "8:28:17"}
1600
+ {"current_steps": 8000, "total_steps": 12698, "loss": 0.2328, "lr": 1.4491598531748053e-05, "epoch": 4.410143329658214, "percentage": 63.0, "elapsed_time": "14:24:58", "remaining_time": "8:27:57"}
1601
+ {"current_steps": 8005, "total_steps": 12698, "loss": 0.2177, "lr": 1.4465176649276984e-05, "epoch": 4.41289966923925, "percentage": 63.04, "elapsed_time": "14:25:48", "remaining_time": "8:27:35"}
1602
+ {"current_steps": 8010, "total_steps": 12698, "loss": 0.2272, "lr": 1.443876522370668e-05, "epoch": 4.415656008820287, "percentage": 63.08, "elapsed_time": "14:26:43", "remaining_time": "8:27:15"}
1603
+ {"current_steps": 8015, "total_steps": 12698, "loss": 0.2166, "lr": 1.441236430493606e-05, "epoch": 4.418412348401323, "percentage": 63.12, "elapsed_time": "14:27:28", "remaining_time": "8:26:51"}
1604
+ {"current_steps": 8020, "total_steps": 12698, "loss": 0.2308, "lr": 1.4385973942844178e-05, "epoch": 4.42116868798236, "percentage": 63.16, "elapsed_time": "14:28:29", "remaining_time": "8:26:34"}
1605
+ {"current_steps": 8025, "total_steps": 12698, "loss": 0.2269, "lr": 1.4359594187290151e-05, "epoch": 4.423925027563396, "percentage": 63.2, "elapsed_time": "14:29:10", "remaining_time": "8:26:07"}
1606
+ {"current_steps": 8030, "total_steps": 12698, "loss": 0.211, "lr": 1.4333225088113058e-05, "epoch": 4.4266813671444325, "percentage": 63.24, "elapsed_time": "14:30:15", "remaining_time": "8:25:53"}
1607
+ {"current_steps": 8035, "total_steps": 12698, "loss": 0.2255, "lr": 1.4306866695131837e-05, "epoch": 4.429437706725468, "percentage": 63.28, "elapsed_time": "14:31:00", "remaining_time": "8:25:28"}
1608
+ {"current_steps": 8040, "total_steps": 12698, "loss": 0.2188, "lr": 1.4280519058145212e-05, "epoch": 4.432194046306505, "percentage": 63.32, "elapsed_time": "14:31:49", "remaining_time": "8:25:05"}
1609
+ {"current_steps": 8045, "total_steps": 12698, "loss": 0.2142, "lr": 1.4254182226931574e-05, "epoch": 4.434950385887541, "percentage": 63.36, "elapsed_time": "14:32:19", "remaining_time": "8:24:31"}
1610
+ {"current_steps": 8050, "total_steps": 12698, "loss": 0.2156, "lr": 1.4227856251248904e-05, "epoch": 4.437706725468578, "percentage": 63.4, "elapsed_time": "14:32:45", "remaining_time": "8:23:55"}
1611
+ {"current_steps": 8055, "total_steps": 12698, "loss": 0.2079, "lr": 1.4201541180834673e-05, "epoch": 4.440463065049614, "percentage": 63.44, "elapsed_time": "14:33:12", "remaining_time": "8:23:19"}
1612
+ {"current_steps": 8060, "total_steps": 12698, "loss": 0.2176, "lr": 1.4175237065405745e-05, "epoch": 4.443219404630651, "percentage": 63.47, "elapsed_time": "14:33:38", "remaining_time": "8:22:43"}
1613
+ {"current_steps": 8065, "total_steps": 12698, "loss": 0.2225, "lr": 1.4148943954658299e-05, "epoch": 4.445975744211687, "percentage": 63.51, "elapsed_time": "14:34:03", "remaining_time": "8:22:06"}
1614
+ {"current_steps": 8070, "total_steps": 12698, "loss": 0.2227, "lr": 1.4122661898267706e-05, "epoch": 4.448732083792724, "percentage": 63.55, "elapsed_time": "14:34:29", "remaining_time": "8:21:30"}
1615
+ {"current_steps": 8075, "total_steps": 12698, "loss": 0.215, "lr": 1.4096390945888467e-05, "epoch": 4.4514884233737595, "percentage": 63.59, "elapsed_time": "14:34:58", "remaining_time": "8:20:55"}
1616
+ {"current_steps": 8080, "total_steps": 12698, "loss": 0.2032, "lr": 1.407013114715409e-05, "epoch": 4.454244762954796, "percentage": 63.63, "elapsed_time": "14:35:26", "remaining_time": "8:20:20"}
1617
+ {"current_steps": 8085, "total_steps": 12698, "loss": 0.2073, "lr": 1.4043882551677028e-05, "epoch": 4.457001102535832, "percentage": 63.67, "elapsed_time": "14:35:54", "remaining_time": "8:19:45"}
1618
+ {"current_steps": 8090, "total_steps": 12698, "loss": 0.1964, "lr": 1.4017645209048554e-05, "epoch": 4.459757442116869, "percentage": 63.71, "elapsed_time": "14:36:18", "remaining_time": "8:19:08"}
1619
+ {"current_steps": 8095, "total_steps": 12698, "loss": 0.2159, "lr": 1.3991419168838683e-05, "epoch": 4.462513781697905, "percentage": 63.75, "elapsed_time": "14:36:45", "remaining_time": "8:18:32"}
1620
+ {"current_steps": 8100, "total_steps": 12698, "loss": 0.2177, "lr": 1.396520448059608e-05, "epoch": 4.465270121278942, "percentage": 63.79, "elapsed_time": "14:37:10", "remaining_time": "8:17:56"}
1621
+ {"current_steps": 8105, "total_steps": 12698, "loss": 0.2009, "lr": 1.3939001193847955e-05, "epoch": 4.468026460859978, "percentage": 63.83, "elapsed_time": "14:37:38", "remaining_time": "8:17:20"}
1622
+ {"current_steps": 8110, "total_steps": 12698, "loss": 0.2059, "lr": 1.3912809358099995e-05, "epoch": 4.470782800441015, "percentage": 63.87, "elapsed_time": "14:38:02", "remaining_time": "8:16:43"}
1623
+ {"current_steps": 8115, "total_steps": 12698, "loss": 0.2081, "lr": 1.3886629022836238e-05, "epoch": 4.4735391400220506, "percentage": 63.91, "elapsed_time": "14:38:30", "remaining_time": "8:16:08"}
1624
+ {"current_steps": 8120, "total_steps": 12698, "loss": 0.2039, "lr": 1.3860460237518993e-05, "epoch": 4.476295479603087, "percentage": 63.95, "elapsed_time": "14:38:57", "remaining_time": "8:15:32"}
1625
+ {"current_steps": 8125, "total_steps": 12698, "loss": 0.2079, "lr": 1.3834303051588757e-05, "epoch": 4.479051819184123, "percentage": 63.99, "elapsed_time": "14:39:22", "remaining_time": "8:14:56"}
1626
+ {"current_steps": 8130, "total_steps": 12698, "loss": 0.2016, "lr": 1.3808157514464102e-05, "epoch": 4.48180815876516, "percentage": 64.03, "elapsed_time": "14:39:49", "remaining_time": "8:14:20"}
1627
+ {"current_steps": 8135, "total_steps": 12698, "loss": 0.203, "lr": 1.3782023675541606e-05, "epoch": 4.484564498346196, "percentage": 64.07, "elapsed_time": "14:40:14", "remaining_time": "8:13:43"}
1628
+ {"current_steps": 8140, "total_steps": 12698, "loss": 0.2006, "lr": 1.3755901584195728e-05, "epoch": 4.487320837927233, "percentage": 64.1, "elapsed_time": "14:40:43", "remaining_time": "8:13:09"}
1629
+ {"current_steps": 8145, "total_steps": 12698, "loss": 0.1999, "lr": 1.372979128977875e-05, "epoch": 4.490077177508269, "percentage": 64.14, "elapsed_time": "14:41:07", "remaining_time": "8:12:32"}
1630
+ {"current_steps": 8150, "total_steps": 12698, "loss": 0.2007, "lr": 1.3703692841620653e-05, "epoch": 4.492833517089306, "percentage": 64.18, "elapsed_time": "14:41:33", "remaining_time": "8:11:56"}
1631
+ {"current_steps": 8155, "total_steps": 12698, "loss": 0.2146, "lr": 1.367760628902904e-05, "epoch": 4.495589856670342, "percentage": 64.22, "elapsed_time": "14:41:56", "remaining_time": "8:11:18"}
1632
+ {"current_steps": 8160, "total_steps": 12698, "loss": 0.2028, "lr": 1.3651531681289048e-05, "epoch": 4.498346196251378, "percentage": 64.26, "elapsed_time": "14:42:26", "remaining_time": "8:10:45"}
1633
+ {"current_steps": 8165, "total_steps": 12698, "loss": 0.2018, "lr": 1.3625469067663237e-05, "epoch": 4.501102535832414, "percentage": 64.3, "elapsed_time": "14:42:53", "remaining_time": "8:10:09"}
1634
+ {"current_steps": 8170, "total_steps": 12698, "loss": 0.2049, "lr": 1.3599418497391512e-05, "epoch": 4.503858875413451, "percentage": 64.34, "elapsed_time": "14:43:23", "remaining_time": "8:09:35"}
1635
+ {"current_steps": 8175, "total_steps": 12698, "loss": 0.2079, "lr": 1.3573380019691019e-05, "epoch": 4.506615214994487, "percentage": 64.38, "elapsed_time": "14:43:49", "remaining_time": "8:08:59"}
1636
+ {"current_steps": 8180, "total_steps": 12698, "loss": 0.2028, "lr": 1.3547353683756056e-05, "epoch": 4.509371554575524, "percentage": 64.42, "elapsed_time": "14:44:13", "remaining_time": "8:08:22"}
1637
+ {"current_steps": 8185, "total_steps": 12698, "loss": 0.2021, "lr": 1.3521339538758e-05, "epoch": 4.51212789415656, "percentage": 64.46, "elapsed_time": "14:44:42", "remaining_time": "8:07:48"}
1638
+ {"current_steps": 8190, "total_steps": 12698, "loss": 0.2038, "lr": 1.3495337633845175e-05, "epoch": 4.514884233737597, "percentage": 64.5, "elapsed_time": "14:45:08", "remaining_time": "8:07:12"}
1639
+ {"current_steps": 8195, "total_steps": 12698, "loss": 0.1971, "lr": 1.3469348018142786e-05, "epoch": 4.517640573318633, "percentage": 64.54, "elapsed_time": "14:45:38", "remaining_time": "8:06:38"}
1640
+ {"current_steps": 8200, "total_steps": 12698, "loss": 0.1986, "lr": 1.3443370740752823e-05, "epoch": 4.5203969128996695, "percentage": 64.58, "elapsed_time": "14:46:02", "remaining_time": "8:06:01"}
1641
+ {"current_steps": 8205, "total_steps": 12698, "loss": 0.208, "lr": 1.3417405850753968e-05, "epoch": 4.523153252480705, "percentage": 64.62, "elapsed_time": "14:46:31", "remaining_time": "8:05:27"}
1642
+ {"current_steps": 8210, "total_steps": 12698, "loss": 0.204, "lr": 1.3391453397201493e-05, "epoch": 4.525909592061742, "percentage": 64.66, "elapsed_time": "14:46:58", "remaining_time": "8:04:52"}
1643
+ {"current_steps": 8215, "total_steps": 12698, "loss": 0.2183, "lr": 1.3365513429127172e-05, "epoch": 4.528665931642778, "percentage": 64.7, "elapsed_time": "14:47:23", "remaining_time": "8:04:15"}
1644
+ {"current_steps": 8220, "total_steps": 12698, "loss": 0.2001, "lr": 1.33395859955392e-05, "epoch": 4.531422271223815, "percentage": 64.73, "elapsed_time": "14:47:50", "remaining_time": "8:03:40"}
1645
+ {"current_steps": 8225, "total_steps": 12698, "loss": 0.2001, "lr": 1.3313671145422077e-05, "epoch": 4.534178610804851, "percentage": 64.77, "elapsed_time": "14:48:21", "remaining_time": "8:03:06"}
1646
+ {"current_steps": 8230, "total_steps": 12698, "loss": 0.2057, "lr": 1.328776892773655e-05, "epoch": 4.536934950385888, "percentage": 64.81, "elapsed_time": "14:48:44", "remaining_time": "8:02:29"}
1647
+ {"current_steps": 8235, "total_steps": 12698, "loss": 0.2019, "lr": 1.3261879391419478e-05, "epoch": 4.539691289966924, "percentage": 64.85, "elapsed_time": "14:49:13", "remaining_time": "8:01:55"}
1648
+ {"current_steps": 8240, "total_steps": 12698, "loss": 0.2001, "lr": 1.3236002585383774e-05, "epoch": 4.5424476295479606, "percentage": 64.89, "elapsed_time": "14:49:40", "remaining_time": "8:01:20"}
1649
+ {"current_steps": 8245, "total_steps": 12698, "loss": 0.1923, "lr": 1.3210138558518295e-05, "epoch": 4.5452039691289965, "percentage": 64.93, "elapsed_time": "14:50:06", "remaining_time": "8:00:44"}
1650
+ {"current_steps": 8250, "total_steps": 12698, "loss": 0.1856, "lr": 1.3184287359687751e-05, "epoch": 4.547960308710033, "percentage": 64.97, "elapsed_time": "14:50:33", "remaining_time": "8:00:08"}
1651
+ {"current_steps": 8255, "total_steps": 12698, "loss": 0.2213, "lr": 1.3158449037732628e-05, "epoch": 4.550716648291069, "percentage": 65.01, "elapsed_time": "14:50:59", "remaining_time": "7:59:33"}
1652
+ {"current_steps": 8260, "total_steps": 12698, "loss": 0.1965, "lr": 1.3132623641469074e-05, "epoch": 4.553472987872106, "percentage": 65.05, "elapsed_time": "14:51:32", "remaining_time": "7:59:00"}
1653
+ {"current_steps": 8265, "total_steps": 12698, "loss": 0.2129, "lr": 1.3106811219688815e-05, "epoch": 4.556229327453142, "percentage": 65.09, "elapsed_time": "14:52:02", "remaining_time": "7:58:27"}
1654
+ {"current_steps": 8270, "total_steps": 12698, "loss": 0.2031, "lr": 1.3081011821159075e-05, "epoch": 4.558985667034179, "percentage": 65.13, "elapsed_time": "14:52:32", "remaining_time": "7:57:53"}
1655
+ {"current_steps": 8275, "total_steps": 12698, "loss": 0.2099, "lr": 1.3055225494622459e-05, "epoch": 4.561742006615215, "percentage": 65.17, "elapsed_time": "14:53:00", "remaining_time": "7:57:18"}
1656
+ {"current_steps": 8280, "total_steps": 12698, "loss": 0.2021, "lr": 1.3029452288796886e-05, "epoch": 4.564498346196252, "percentage": 65.21, "elapsed_time": "14:53:27", "remaining_time": "7:56:43"}
1657
+ {"current_steps": 8285, "total_steps": 12698, "loss": 0.1938, "lr": 1.3003692252375486e-05, "epoch": 4.5672546857772875, "percentage": 65.25, "elapsed_time": "14:53:53", "remaining_time": "7:56:07"}
1658
+ {"current_steps": 8290, "total_steps": 12698, "loss": 0.1934, "lr": 1.2977945434026504e-05, "epoch": 4.570011025358324, "percentage": 65.29, "elapsed_time": "14:54:19", "remaining_time": "7:55:31"}
1659
+ {"current_steps": 8295, "total_steps": 12698, "loss": 0.1897, "lr": 1.2952211882393211e-05, "epoch": 4.57276736493936, "percentage": 65.33, "elapsed_time": "14:54:44", "remaining_time": "7:54:55"}
1660
+ {"current_steps": 8300, "total_steps": 12698, "loss": 0.1866, "lr": 1.292649164609381e-05, "epoch": 4.575523704520397, "percentage": 65.36, "elapsed_time": "14:55:10", "remaining_time": "7:54:20"}
1661
+ {"current_steps": 8305, "total_steps": 12698, "loss": 0.1943, "lr": 1.2900784773721365e-05, "epoch": 4.578280044101433, "percentage": 65.4, "elapsed_time": "14:55:39", "remaining_time": "7:53:46"}
1662
+ {"current_steps": 8310, "total_steps": 12698, "loss": 0.1809, "lr": 1.2875091313843674e-05, "epoch": 4.58103638368247, "percentage": 65.44, "elapsed_time": "14:56:04", "remaining_time": "7:53:09"}
1663
+ {"current_steps": 8315, "total_steps": 12698, "loss": 0.1913, "lr": 1.2849411315003199e-05, "epoch": 4.583792723263506, "percentage": 65.48, "elapsed_time": "14:56:31", "remaining_time": "7:52:34"}
1664
+ {"current_steps": 8320, "total_steps": 12698, "loss": 0.2208, "lr": 1.2823744825716974e-05, "epoch": 4.586549062844543, "percentage": 65.52, "elapsed_time": "14:56:56", "remaining_time": "7:51:58"}
1665
+ {"current_steps": 8325, "total_steps": 12698, "loss": 0.1921, "lr": 1.2798091894476503e-05, "epoch": 4.589305402425579, "percentage": 65.56, "elapsed_time": "14:57:22", "remaining_time": "7:51:22"}
1666
+ {"current_steps": 8330, "total_steps": 12698, "loss": 0.2001, "lr": 1.2772452569747685e-05, "epoch": 4.592061742006615, "percentage": 65.6, "elapsed_time": "14:57:48", "remaining_time": "7:50:46"}
1667
+ {"current_steps": 8335, "total_steps": 12698, "loss": 0.19, "lr": 1.2746826899970706e-05, "epoch": 4.594818081587651, "percentage": 65.64, "elapsed_time": "14:58:14", "remaining_time": "7:50:11"}
1668
+ {"current_steps": 8340, "total_steps": 12698, "loss": 0.1965, "lr": 1.2721214933559947e-05, "epoch": 4.597574421168688, "percentage": 65.68, "elapsed_time": "14:58:42", "remaining_time": "7:49:36"}
1669
+ {"current_steps": 8345, "total_steps": 12698, "loss": 0.1976, "lr": 1.269561671890391e-05, "epoch": 4.600330760749724, "percentage": 65.72, "elapsed_time": "14:59:13", "remaining_time": "7:49:03"}
1670
+ {"current_steps": 8350, "total_steps": 12698, "loss": 0.1847, "lr": 1.2670032304365116e-05, "epoch": 4.603087100330761, "percentage": 65.76, "elapsed_time": "14:59:41", "remaining_time": "7:48:29"}
1671
+ {"current_steps": 8355, "total_steps": 12698, "loss": 0.2014, "lr": 1.264446173828001e-05, "epoch": 4.605843439911797, "percentage": 65.8, "elapsed_time": "15:00:08", "remaining_time": "7:47:54"}
1672
+ {"current_steps": 8360, "total_steps": 12698, "loss": 0.1917, "lr": 1.2618905068958867e-05, "epoch": 4.608599779492834, "percentage": 65.84, "elapsed_time": "15:00:35", "remaining_time": "7:47:19"}
1673
+ {"current_steps": 8365, "total_steps": 12698, "loss": 0.1936, "lr": 1.2593362344685717e-05, "epoch": 4.61135611907387, "percentage": 65.88, "elapsed_time": "15:01:00", "remaining_time": "7:46:42"}
1674
+ {"current_steps": 8370, "total_steps": 12698, "loss": 0.2073, "lr": 1.2567833613718237e-05, "epoch": 4.6141124586549065, "percentage": 65.92, "elapsed_time": "15:01:30", "remaining_time": "7:46:09"}
1675
+ {"current_steps": 8375, "total_steps": 12698, "loss": 0.1988, "lr": 1.2542318924287678e-05, "epoch": 4.616868798235942, "percentage": 65.96, "elapsed_time": "15:01:57", "remaining_time": "7:45:34"}
1676
+ {"current_steps": 8380, "total_steps": 12698, "loss": 0.2077, "lr": 1.2516818324598742e-05, "epoch": 4.619625137816979, "percentage": 65.99, "elapsed_time": "15:02:23", "remaining_time": "7:44:58"}
1677
+ {"current_steps": 8385, "total_steps": 12698, "loss": 0.1976, "lr": 1.2491331862829532e-05, "epoch": 4.622381477398015, "percentage": 66.03, "elapsed_time": "15:02:47", "remaining_time": "7:44:22"}
1678
+ {"current_steps": 8390, "total_steps": 12698, "loss": 0.2146, "lr": 1.2465859587131428e-05, "epoch": 4.625137816979052, "percentage": 66.07, "elapsed_time": "15:03:15", "remaining_time": "7:43:47"}
1679
+ {"current_steps": 8395, "total_steps": 12698, "loss": 0.1984, "lr": 1.2440401545629009e-05, "epoch": 4.627894156560088, "percentage": 66.11, "elapsed_time": "15:03:43", "remaining_time": "7:43:13"}
1680
+ {"current_steps": 8400, "total_steps": 12698, "loss": 0.2032, "lr": 1.2414957786419967e-05, "epoch": 4.630650496141125, "percentage": 66.15, "elapsed_time": "15:04:08", "remaining_time": "7:42:37"}
1681
+ {"current_steps": 8405, "total_steps": 12698, "loss": 0.2018, "lr": 1.2389528357575013e-05, "epoch": 4.633406835722161, "percentage": 66.19, "elapsed_time": "15:04:40", "remaining_time": "7:42:04"}
1682
+ {"current_steps": 8410, "total_steps": 12698, "loss": 0.1947, "lr": 1.2364113307137773e-05, "epoch": 4.6361631753031975, "percentage": 66.23, "elapsed_time": "15:05:05", "remaining_time": "7:41:28"}
1683
+ {"current_steps": 8415, "total_steps": 12698, "loss": 0.1995, "lr": 1.2338712683124717e-05, "epoch": 4.6389195148842335, "percentage": 66.27, "elapsed_time": "15:05:30", "remaining_time": "7:40:52"}
1684
+ {"current_steps": 8420, "total_steps": 12698, "loss": 0.2005, "lr": 1.231332653352505e-05, "epoch": 4.64167585446527, "percentage": 66.31, "elapsed_time": "15:05:54", "remaining_time": "7:40:16"}
1685
+ {"current_steps": 8425, "total_steps": 12698, "loss": 0.192, "lr": 1.2287954906300638e-05, "epoch": 4.644432194046306, "percentage": 66.35, "elapsed_time": "15:06:21", "remaining_time": "7:39:41"}
1686
+ {"current_steps": 8430, "total_steps": 12698, "loss": 0.1849, "lr": 1.2262597849385908e-05, "epoch": 4.647188533627343, "percentage": 66.39, "elapsed_time": "15:06:53", "remaining_time": "7:39:09"}
1687
+ {"current_steps": 8435, "total_steps": 12698, "loss": 0.1987, "lr": 1.2237255410687766e-05, "epoch": 4.649944873208379, "percentage": 66.43, "elapsed_time": "15:07:22", "remaining_time": "7:38:34"}
1688
+ {"current_steps": 8440, "total_steps": 12698, "loss": 0.1837, "lr": 1.2211927638085487e-05, "epoch": 4.652701212789416, "percentage": 66.47, "elapsed_time": "15:07:49", "remaining_time": "7:37:59"}
1689
+ {"current_steps": 8445, "total_steps": 12698, "loss": 0.1992, "lr": 1.218661457943065e-05, "epoch": 4.655457552370452, "percentage": 66.51, "elapsed_time": "15:08:14", "remaining_time": "7:37:24"}
1690
+ {"current_steps": 8450, "total_steps": 12698, "loss": 0.1952, "lr": 1.2161316282547024e-05, "epoch": 4.658213891951489, "percentage": 66.55, "elapsed_time": "15:08:41", "remaining_time": "7:36:49"}
1691
+ {"current_steps": 8455, "total_steps": 12698, "loss": 0.1974, "lr": 1.2136032795230492e-05, "epoch": 4.6609702315325245, "percentage": 66.59, "elapsed_time": "15:09:09", "remaining_time": "7:36:14"}
1692
+ {"current_steps": 8460, "total_steps": 12698, "loss": 0.1898, "lr": 1.211076416524897e-05, "epoch": 4.663726571113561, "percentage": 66.62, "elapsed_time": "15:09:33", "remaining_time": "7:35:38"}
1693
+ {"current_steps": 8465, "total_steps": 12698, "loss": 0.2008, "lr": 1.2085510440342282e-05, "epoch": 4.666482910694597, "percentage": 66.66, "elapsed_time": "15:10:01", "remaining_time": "7:35:03"}
1694
+ {"current_steps": 8470, "total_steps": 12698, "loss": 0.1923, "lr": 1.2060271668222115e-05, "epoch": 4.669239250275634, "percentage": 66.7, "elapsed_time": "15:10:33", "remaining_time": "7:34:31"}
1695
+ {"current_steps": 8475, "total_steps": 12698, "loss": 0.1876, "lr": 1.2035047896571884e-05, "epoch": 4.67199558985667, "percentage": 66.74, "elapsed_time": "15:11:04", "remaining_time": "7:33:58"}
1696
+ {"current_steps": 8480, "total_steps": 12698, "loss": 0.1877, "lr": 1.2009839173046673e-05, "epoch": 4.674751929437707, "percentage": 66.78, "elapsed_time": "15:11:31", "remaining_time": "7:33:23"}
1697
+ {"current_steps": 8485, "total_steps": 12698, "loss": 0.1917, "lr": 1.1984645545273145e-05, "epoch": 4.677508269018743, "percentage": 66.82, "elapsed_time": "15:12:00", "remaining_time": "7:32:50"}
1698
+ {"current_steps": 8490, "total_steps": 12698, "loss": 0.1869, "lr": 1.1959467060849432e-05, "epoch": 4.68026460859978, "percentage": 66.86, "elapsed_time": "15:12:28", "remaining_time": "7:32:15"}
1699
+ {"current_steps": 8495, "total_steps": 12698, "loss": 0.1819, "lr": 1.1934303767345057e-05, "epoch": 4.683020948180816, "percentage": 66.9, "elapsed_time": "15:12:55", "remaining_time": "7:31:40"}
1700
+ {"current_steps": 8500, "total_steps": 12698, "loss": 0.1844, "lr": 1.1909155712300844e-05, "epoch": 4.685777287761852, "percentage": 66.94, "elapsed_time": "15:13:20", "remaining_time": "7:31:05"}
1701
+ {"current_steps": 8505, "total_steps": 12698, "loss": 0.1821, "lr": 1.1884022943228824e-05, "epoch": 4.688533627342888, "percentage": 66.98, "elapsed_time": "15:13:47", "remaining_time": "7:30:29"}
1702
+ {"current_steps": 8510, "total_steps": 12698, "loss": 0.2011, "lr": 1.1858905507612156e-05, "epoch": 4.691289966923925, "percentage": 67.02, "elapsed_time": "15:14:14", "remaining_time": "7:29:55"}
1703
+ {"current_steps": 8515, "total_steps": 12698, "loss": 0.1977, "lr": 1.1833803452905025e-05, "epoch": 4.694046306504961, "percentage": 67.06, "elapsed_time": "15:14:37", "remaining_time": "7:29:18"}
1704
+ {"current_steps": 8520, "total_steps": 12698, "loss": 0.183, "lr": 1.1808716826532556e-05, "epoch": 4.696802646085998, "percentage": 67.1, "elapsed_time": "15:15:04", "remaining_time": "7:28:43"}
1705
+ {"current_steps": 8525, "total_steps": 12698, "loss": 0.18, "lr": 1.1783645675890725e-05, "epoch": 4.699558985667034, "percentage": 67.14, "elapsed_time": "15:15:30", "remaining_time": "7:28:08"}
1706
+ {"current_steps": 8530, "total_steps": 12698, "loss": 0.1947, "lr": 1.175859004834627e-05, "epoch": 4.702315325248071, "percentage": 67.18, "elapsed_time": "15:15:56", "remaining_time": "7:27:33"}
1707
+ {"current_steps": 8535, "total_steps": 12698, "loss": 0.1888, "lr": 1.1733549991236608e-05, "epoch": 4.705071664829107, "percentage": 67.22, "elapsed_time": "15:16:23", "remaining_time": "7:26:58"}
1708
+ {"current_steps": 8540, "total_steps": 12698, "loss": 0.2004, "lr": 1.1708525551869729e-05, "epoch": 4.7078280044101435, "percentage": 67.25, "elapsed_time": "15:16:47", "remaining_time": "7:26:22"}
1709
+ {"current_steps": 8545, "total_steps": 12698, "loss": 0.1931, "lr": 1.1683516777524127e-05, "epoch": 4.710584343991179, "percentage": 67.29, "elapsed_time": "15:17:16", "remaining_time": "7:25:48"}
1710
+ {"current_steps": 8550, "total_steps": 12698, "loss": 0.1877, "lr": 1.1658523715448683e-05, "epoch": 4.713340683572216, "percentage": 67.33, "elapsed_time": "15:17:41", "remaining_time": "7:25:13"}
1711
+ {"current_steps": 8555, "total_steps": 12698, "loss": 0.1995, "lr": 1.1633546412862612e-05, "epoch": 4.716097023153252, "percentage": 67.37, "elapsed_time": "15:18:08", "remaining_time": "7:24:38"}
1712
+ {"current_steps": 8560, "total_steps": 12698, "loss": 0.1818, "lr": 1.1608584916955348e-05, "epoch": 4.718853362734289, "percentage": 67.41, "elapsed_time": "15:18:38", "remaining_time": "7:24:04"}
1713
+ {"current_steps": 8565, "total_steps": 12698, "loss": 0.1009, "lr": 1.1583639274886461e-05, "epoch": 4.721609702315325, "percentage": 67.45, "elapsed_time": "15:19:06", "remaining_time": "7:23:30"}
1714
+ {"current_steps": 8570, "total_steps": 12698, "loss": 0.0802, "lr": 1.155870953378556e-05, "epoch": 4.724366041896362, "percentage": 67.49, "elapsed_time": "15:19:31", "remaining_time": "7:22:55"}
1715
+ {"current_steps": 8575, "total_steps": 12698, "loss": 0.0779, "lr": 1.1533795740752228e-05, "epoch": 4.727122381477398, "percentage": 67.53, "elapsed_time": "15:19:58", "remaining_time": "7:22:20"}
1716
+ {"current_steps": 8580, "total_steps": 12698, "loss": 0.0921, "lr": 1.1508897942855902e-05, "epoch": 4.7298787210584345, "percentage": 67.57, "elapsed_time": "15:20:22", "remaining_time": "7:21:44"}
1717
+ {"current_steps": 8585, "total_steps": 12698, "loss": 0.077, "lr": 1.1484016187135815e-05, "epoch": 4.7326350606394705, "percentage": 67.61, "elapsed_time": "15:20:50", "remaining_time": "7:21:10"}
1718
+ {"current_steps": 8590, "total_steps": 12698, "loss": 0.1038, "lr": 1.1459150520600873e-05, "epoch": 4.735391400220507, "percentage": 67.65, "elapsed_time": "15:21:14", "remaining_time": "7:20:33"}
1719
+ {"current_steps": 8595, "total_steps": 12698, "loss": 0.1165, "lr": 1.143430099022961e-05, "epoch": 4.738147739801543, "percentage": 67.69, "elapsed_time": "15:21:44", "remaining_time": "7:20:00"}
1720
+ {"current_steps": 8600, "total_steps": 12698, "loss": 0.0865, "lr": 1.1409467642970053e-05, "epoch": 4.74090407938258, "percentage": 67.73, "elapsed_time": "15:22:07", "remaining_time": "7:19:24"}
1721
+ {"current_steps": 8605, "total_steps": 12698, "loss": 0.1099, "lr": 1.1384650525739662e-05, "epoch": 4.743660418963616, "percentage": 67.77, "elapsed_time": "15:22:50", "remaining_time": "7:18:57"}
1722
+ {"current_steps": 8610, "total_steps": 12698, "loss": 0.0804, "lr": 1.1359849685425232e-05, "epoch": 4.746416758544653, "percentage": 67.81, "elapsed_time": "15:23:32", "remaining_time": "7:18:29"}
1723
+ {"current_steps": 8615, "total_steps": 12698, "loss": 0.0768, "lr": 1.1335065168882807e-05, "epoch": 4.749173098125689, "percentage": 67.85, "elapsed_time": "15:24:12", "remaining_time": "7:18:01"}
1724
+ {"current_steps": 8620, "total_steps": 12698, "loss": 0.0792, "lr": 1.1310297022937589e-05, "epoch": 4.751929437706726, "percentage": 67.88, "elapsed_time": "15:24:40", "remaining_time": "7:17:26"}
1725
+ {"current_steps": 8625, "total_steps": 12698, "loss": 0.0941, "lr": 1.1285545294383855e-05, "epoch": 4.7546857772877615, "percentage": 67.92, "elapsed_time": "15:25:18", "remaining_time": "7:16:57"}
1726
+ {"current_steps": 8630, "total_steps": 12698, "loss": 0.1001, "lr": 1.1260810029984861e-05, "epoch": 4.757442116868798, "percentage": 67.96, "elapsed_time": "15:25:46", "remaining_time": "7:16:23"}
1727
+ {"current_steps": 8635, "total_steps": 12698, "loss": 0.0802, "lr": 1.1236091276472751e-05, "epoch": 4.760198456449834, "percentage": 68.0, "elapsed_time": "15:26:14", "remaining_time": "7:15:49"}
1728
+ {"current_steps": 8640, "total_steps": 12698, "loss": 0.0704, "lr": 1.1211389080548499e-05, "epoch": 4.762954796030871, "percentage": 68.04, "elapsed_time": "15:26:39", "remaining_time": "7:15:13"}
1729
+ {"current_steps": 8645, "total_steps": 12698, "loss": 0.0755, "lr": 1.1186703488881773e-05, "epoch": 4.765711135611907, "percentage": 68.08, "elapsed_time": "15:27:01", "remaining_time": "7:14:36"}
1730
+ {"current_steps": 8650, "total_steps": 12698, "loss": 0.0908, "lr": 1.116203454811088e-05, "epoch": 4.768467475192944, "percentage": 68.12, "elapsed_time": "15:27:22", "remaining_time": "7:13:59"}
1731
+ {"current_steps": 8655, "total_steps": 12698, "loss": 0.0867, "lr": 1.1137382304842665e-05, "epoch": 4.77122381477398, "percentage": 68.16, "elapsed_time": "15:27:56", "remaining_time": "7:13:28"}
1732
+ {"current_steps": 8660, "total_steps": 12698, "loss": 0.0872, "lr": 1.1112746805652432e-05, "epoch": 4.773980154355017, "percentage": 68.2, "elapsed_time": "15:28:21", "remaining_time": "7:12:52"}
1733
+ {"current_steps": 8665, "total_steps": 12698, "loss": 0.0945, "lr": 1.1088128097083841e-05, "epoch": 4.776736493936053, "percentage": 68.24, "elapsed_time": "15:28:53", "remaining_time": "7:12:20"}
1734
+ {"current_steps": 8670, "total_steps": 12698, "loss": 0.1065, "lr": 1.106352622564884e-05, "epoch": 4.779492833517089, "percentage": 68.28, "elapsed_time": "15:29:23", "remaining_time": "7:11:47"}
1735
+ {"current_steps": 8675, "total_steps": 12698, "loss": 0.076, "lr": 1.1038941237827565e-05, "epoch": 4.782249173098125, "percentage": 68.32, "elapsed_time": "15:29:44", "remaining_time": "7:11:09"}
1736
+ {"current_steps": 8680, "total_steps": 12698, "loss": 0.1164, "lr": 1.1014373180068246e-05, "epoch": 4.785005512679162, "percentage": 68.36, "elapsed_time": "15:30:09", "remaining_time": "7:10:34"}
1737
+ {"current_steps": 8685, "total_steps": 12698, "loss": 0.0972, "lr": 1.0989822098787126e-05, "epoch": 4.787761852260198, "percentage": 68.4, "elapsed_time": "15:30:41", "remaining_time": "7:10:02"}
1738
+ {"current_steps": 8690, "total_steps": 12698, "loss": 0.0809, "lr": 1.09652880403684e-05, "epoch": 4.790518191841235, "percentage": 68.44, "elapsed_time": "15:31:08", "remaining_time": "7:09:27"}
1739
+ {"current_steps": 8695, "total_steps": 12698, "loss": 0.2349, "lr": 1.0940771051164072e-05, "epoch": 4.793274531422271, "percentage": 68.48, "elapsed_time": "15:31:56", "remaining_time": "7:09:02"}
1740
+ {"current_steps": 8700, "total_steps": 12698, "loss": 0.1189, "lr": 1.0916271177493907e-05, "epoch": 4.796030871003308, "percentage": 68.51, "elapsed_time": "15:32:26", "remaining_time": "7:08:29"}
1741
+ {"current_steps": 8705, "total_steps": 12698, "loss": 0.0964, "lr": 1.0891788465645338e-05, "epoch": 4.798787210584344, "percentage": 68.55, "elapsed_time": "15:33:04", "remaining_time": "7:08:00"}
1742
+ {"current_steps": 8710, "total_steps": 12698, "loss": 0.1726, "lr": 1.0867322961873373e-05, "epoch": 4.8015435501653805, "percentage": 68.59, "elapsed_time": "15:33:54", "remaining_time": "7:07:36"}
1743
+ {"current_steps": 8715, "total_steps": 12698, "loss": 0.0829, "lr": 1.0842874712400499e-05, "epoch": 4.804299889746416, "percentage": 68.63, "elapsed_time": "15:34:22", "remaining_time": "7:07:01"}
1744
+ {"current_steps": 8720, "total_steps": 12698, "loss": 0.0815, "lr": 1.0818443763416622e-05, "epoch": 4.807056229327453, "percentage": 68.67, "elapsed_time": "15:34:57", "remaining_time": "7:06:31"}
1745
+ {"current_steps": 8725, "total_steps": 12698, "loss": 0.0874, "lr": 1.0794030161078948e-05, "epoch": 4.809812568908489, "percentage": 68.71, "elapsed_time": "15:35:25", "remaining_time": "7:05:57"}
1746
+ {"current_steps": 8730, "total_steps": 12698, "loss": 0.0783, "lr": 1.0769633951511915e-05, "epoch": 4.812568908489526, "percentage": 68.75, "elapsed_time": "15:35:50", "remaining_time": "7:05:21"}
1747
+ {"current_steps": 8735, "total_steps": 12698, "loss": 0.0793, "lr": 1.0745255180807094e-05, "epoch": 4.815325248070562, "percentage": 68.79, "elapsed_time": "15:36:20", "remaining_time": "7:04:48"}
1748
+ {"current_steps": 8740, "total_steps": 12698, "loss": 0.0713, "lr": 1.0720893895023134e-05, "epoch": 4.818081587651599, "percentage": 68.83, "elapsed_time": "15:36:41", "remaining_time": "7:04:11"}
1749
+ {"current_steps": 8745, "total_steps": 12698, "loss": 0.0798, "lr": 1.069655014018562e-05, "epoch": 4.820837927232635, "percentage": 68.87, "elapsed_time": "15:37:02", "remaining_time": "7:03:34"}
1750
+ {"current_steps": 8750, "total_steps": 12698, "loss": 0.0697, "lr": 1.067222396228703e-05, "epoch": 4.8235942668136715, "percentage": 68.91, "elapsed_time": "15:37:25", "remaining_time": "7:02:58"}
1751
+ {"current_steps": 8755, "total_steps": 12698, "loss": 0.1141, "lr": 1.0647915407286632e-05, "epoch": 4.8263506063947075, "percentage": 68.95, "elapsed_time": "15:38:08", "remaining_time": "7:02:30"}
1752
+ {"current_steps": 8760, "total_steps": 12698, "loss": 0.0652, "lr": 1.0623624521110397e-05, "epoch": 4.829106945975744, "percentage": 68.99, "elapsed_time": "15:38:30", "remaining_time": "7:01:54"}
1753
+ {"current_steps": 8765, "total_steps": 12698, "loss": 0.0714, "lr": 1.059935134965092e-05, "epoch": 4.83186328555678, "percentage": 69.03, "elapsed_time": "15:38:52", "remaining_time": "7:01:17"}
1754
+ {"current_steps": 8770, "total_steps": 12698, "loss": 0.0703, "lr": 1.057509593876732e-05, "epoch": 4.834619625137817, "percentage": 69.07, "elapsed_time": "15:39:15", "remaining_time": "7:00:41"}
1755
+ {"current_steps": 8775, "total_steps": 12698, "loss": 0.1091, "lr": 1.0550858334285165e-05, "epoch": 4.837375964718853, "percentage": 69.11, "elapsed_time": "15:40:08", "remaining_time": "7:00:18"}
1756
+ {"current_steps": 8780, "total_steps": 12698, "loss": 0.0753, "lr": 1.0526638581996378e-05, "epoch": 4.84013230429989, "percentage": 69.14, "elapsed_time": "15:40:33", "remaining_time": "6:59:42"}
1757
+ {"current_steps": 8785, "total_steps": 12698, "loss": 0.1139, "lr": 1.0502436727659169e-05, "epoch": 4.842888643880926, "percentage": 69.18, "elapsed_time": "15:41:05", "remaining_time": "6:59:10"}
1758
+ {"current_steps": 8790, "total_steps": 12698, "loss": 0.0808, "lr": 1.0478252816997918e-05, "epoch": 4.845644983461963, "percentage": 69.22, "elapsed_time": "15:41:27", "remaining_time": "6:58:34"}
1759
+ {"current_steps": 8795, "total_steps": 12698, "loss": 0.1065, "lr": 1.0454086895703108e-05, "epoch": 4.8484013230429985, "percentage": 69.26, "elapsed_time": "15:42:03", "remaining_time": "6:58:03"}
1760
+ {"current_steps": 8800, "total_steps": 12698, "loss": 0.1076, "lr": 1.0429939009431229e-05, "epoch": 4.851157662624035, "percentage": 69.3, "elapsed_time": "15:42:30", "remaining_time": "6:57:29"}
1761
+ {"current_steps": 8805, "total_steps": 12698, "loss": 0.104, "lr": 1.0405809203804713e-05, "epoch": 4.853914002205071, "percentage": 69.34, "elapsed_time": "15:42:55", "remaining_time": "6:56:54"}
1762
+ {"current_steps": 8810, "total_steps": 12698, "loss": 0.0794, "lr": 1.0381697524411817e-05, "epoch": 4.856670341786108, "percentage": 69.38, "elapsed_time": "15:43:16", "remaining_time": "6:56:16"}
1763
+ {"current_steps": 8815, "total_steps": 12698, "loss": 0.0845, "lr": 1.0357604016806562e-05, "epoch": 4.859426681367144, "percentage": 69.42, "elapsed_time": "15:43:45", "remaining_time": "6:55:43"}
1764
+ {"current_steps": 8820, "total_steps": 12698, "loss": 0.0837, "lr": 1.0333528726508628e-05, "epoch": 4.862183020948181, "percentage": 69.46, "elapsed_time": "15:44:29", "remaining_time": "6:55:16"}
1765
+ {"current_steps": 8825, "total_steps": 12698, "loss": 0.0726, "lr": 1.0309471699003288e-05, "epoch": 4.864939360529217, "percentage": 69.5, "elapsed_time": "15:44:58", "remaining_time": "6:54:42"}
1766
+ {"current_steps": 8830, "total_steps": 12698, "loss": 0.0669, "lr": 1.0285432979741295e-05, "epoch": 4.867695700110254, "percentage": 69.54, "elapsed_time": "15:45:33", "remaining_time": "6:54:12"}
1767
+ {"current_steps": 8835, "total_steps": 12698, "loss": 0.0786, "lr": 1.0261412614138839e-05, "epoch": 4.87045203969129, "percentage": 69.58, "elapsed_time": "15:45:59", "remaining_time": "6:53:37"}
1768
+ {"current_steps": 8840, "total_steps": 12698, "loss": 0.0891, "lr": 1.0237410647577415e-05, "epoch": 4.873208379272326, "percentage": 69.62, "elapsed_time": "15:46:52", "remaining_time": "6:53:14"}
1769
+ {"current_steps": 8845, "total_steps": 12698, "loss": 0.0868, "lr": 1.0213427125403756e-05, "epoch": 4.875964718853362, "percentage": 69.66, "elapsed_time": "15:47:16", "remaining_time": "6:52:38"}
1770
+ {"current_steps": 8850, "total_steps": 12698, "loss": 0.0878, "lr": 1.0189462092929756e-05, "epoch": 4.878721058434399, "percentage": 69.7, "elapsed_time": "15:47:38", "remaining_time": "6:52:02"}
1771
+ {"current_steps": 8855, "total_steps": 12698, "loss": 0.0713, "lr": 1.016551559543237e-05, "epoch": 4.881477398015435, "percentage": 69.74, "elapsed_time": "15:48:05", "remaining_time": "6:51:27"}
1772
+ {"current_steps": 8860, "total_steps": 12698, "loss": 0.0844, "lr": 1.0141587678153542e-05, "epoch": 4.884233737596472, "percentage": 69.77, "elapsed_time": "15:48:39", "remaining_time": "6:50:56"}
1773
+ {"current_steps": 8865, "total_steps": 12698, "loss": 0.0739, "lr": 1.0117678386300107e-05, "epoch": 4.886990077177508, "percentage": 69.81, "elapsed_time": "15:49:02", "remaining_time": "6:50:20"}
1774
+ {"current_steps": 8870, "total_steps": 12698, "loss": 0.0811, "lr": 1.0093787765043715e-05, "epoch": 4.889746416758545, "percentage": 69.85, "elapsed_time": "15:49:27", "remaining_time": "6:49:45"}
1775
+ {"current_steps": 8875, "total_steps": 12698, "loss": 0.0771, "lr": 1.0069915859520726e-05, "epoch": 4.892502756339581, "percentage": 69.89, "elapsed_time": "15:49:52", "remaining_time": "6:49:10"}
1776
+ {"current_steps": 8880, "total_steps": 12698, "loss": 0.0784, "lr": 1.0046062714832176e-05, "epoch": 4.8952590959206175, "percentage": 69.93, "elapsed_time": "15:50:17", "remaining_time": "6:48:35"}
1777
+ {"current_steps": 8885, "total_steps": 12698, "loss": 0.0929, "lr": 1.0022228376043626e-05, "epoch": 4.898015435501653, "percentage": 69.97, "elapsed_time": "15:50:59", "remaining_time": "6:48:07"}
1778
+ {"current_steps": 8890, "total_steps": 12698, "loss": 0.0782, "lr": 9.998412888185117e-06, "epoch": 4.90077177508269, "percentage": 70.01, "elapsed_time": "15:51:19", "remaining_time": "6:47:29"}
1779
+ {"current_steps": 8895, "total_steps": 12698, "loss": 0.0901, "lr": 9.974616296251067e-06, "epoch": 4.903528114663727, "percentage": 70.05, "elapsed_time": "15:51:41", "remaining_time": "6:46:53"}
1780
+ {"current_steps": 8900, "total_steps": 12698, "loss": 0.1003, "lr": 9.950838645200209e-06, "epoch": 4.906284454244763, "percentage": 70.09, "elapsed_time": "15:52:20", "remaining_time": "6:46:24"}
1781
+ {"current_steps": 8905, "total_steps": 12698, "loss": 0.0812, "lr": 9.927079979955479e-06, "epoch": 4.909040793825799, "percentage": 70.13, "elapsed_time": "15:52:45", "remaining_time": "6:45:49"}
1782
+ {"current_steps": 8910, "total_steps": 12698, "loss": 0.0701, "lr": 9.903340345403947e-06, "epoch": 4.911797133406836, "percentage": 70.17, "elapsed_time": "15:53:07", "remaining_time": "6:45:12"}
1783
+ {"current_steps": 8915, "total_steps": 12698, "loss": 0.0848, "lr": 9.87961978639673e-06, "epoch": 4.914553472987873, "percentage": 70.21, "elapsed_time": "15:53:35", "remaining_time": "6:44:38"}
1784
+ {"current_steps": 8920, "total_steps": 12698, "loss": 0.0937, "lr": 9.855918347748905e-06, "epoch": 4.9173098125689085, "percentage": 70.25, "elapsed_time": "15:54:14", "remaining_time": "6:44:09"}
1785
+ {"current_steps": 8925, "total_steps": 12698, "loss": 0.0618, "lr": 9.832236074239415e-06, "epoch": 4.9200661521499445, "percentage": 70.29, "elapsed_time": "15:54:34", "remaining_time": "6:43:32"}
1786
+ {"current_steps": 8930, "total_steps": 12698, "loss": 0.0833, "lr": 9.80857301061102e-06, "epoch": 4.922822491730981, "percentage": 70.33, "elapsed_time": "15:55:16", "remaining_time": "6:43:04"}
1787
+ {"current_steps": 8935, "total_steps": 12698, "loss": 0.0737, "lr": 9.784929201570166e-06, "epoch": 4.925578831312018, "percentage": 70.37, "elapsed_time": "15:55:44", "remaining_time": "6:42:30"}
1788
+ {"current_steps": 8940, "total_steps": 12698, "loss": 0.0645, "lr": 9.761304691786921e-06, "epoch": 4.928335170893054, "percentage": 70.4, "elapsed_time": "15:56:09", "remaining_time": "6:41:55"}
1789
+ {"current_steps": 8945, "total_steps": 12698, "loss": 0.0867, "lr": 9.737699525894902e-06, "epoch": 4.93109151047409, "percentage": 70.44, "elapsed_time": "15:56:35", "remaining_time": "6:41:21"}
1790
+ {"current_steps": 8950, "total_steps": 12698, "loss": 0.0727, "lr": 9.714113748491167e-06, "epoch": 4.933847850055127, "percentage": 70.48, "elapsed_time": "15:57:05", "remaining_time": "6:40:48"}
1791
+ {"current_steps": 8955, "total_steps": 12698, "loss": 0.101, "lr": 9.69054740413616e-06, "epoch": 4.936604189636164, "percentage": 70.52, "elapsed_time": "15:57:36", "remaining_time": "6:40:15"}
1792
+ {"current_steps": 8960, "total_steps": 12698, "loss": 0.0877, "lr": 9.667000537353593e-06, "epoch": 4.9393605292172, "percentage": 70.56, "elapsed_time": "15:58:03", "remaining_time": "6:39:41"}
1793
+ {"current_steps": 8965, "total_steps": 12698, "loss": 0.0929, "lr": 9.643473192630391e-06, "epoch": 4.9421168687982355, "percentage": 70.6, "elapsed_time": "15:58:26", "remaining_time": "6:39:05"}
1794
+ {"current_steps": 8970, "total_steps": 12698, "loss": 0.0736, "lr": 9.61996541441659e-06, "epoch": 4.944873208379272, "percentage": 70.64, "elapsed_time": "15:58:46", "remaining_time": "6:38:28"}
1795
+ {"current_steps": 8975, "total_steps": 12698, "loss": 0.0818, "lr": 9.596477247125253e-06, "epoch": 4.947629547960309, "percentage": 70.68, "elapsed_time": "15:59:10", "remaining_time": "6:37:53"}
1796
+ {"current_steps": 8980, "total_steps": 12698, "loss": 0.0752, "lr": 9.57300873513242e-06, "epoch": 4.950385887541345, "percentage": 70.72, "elapsed_time": "15:59:30", "remaining_time": "6:37:15"}
1797
+ {"current_steps": 8985, "total_steps": 12698, "loss": 0.1011, "lr": 9.549559922776968e-06, "epoch": 4.953142227122381, "percentage": 70.76, "elapsed_time": "16:00:03", "remaining_time": "6:36:44"}
1798
+ {"current_steps": 8990, "total_steps": 12698, "loss": 0.0985, "lr": 9.52613085436056e-06, "epoch": 4.955898566703418, "percentage": 70.8, "elapsed_time": "16:00:45", "remaining_time": "6:36:16"}
1799
+ {"current_steps": 8995, "total_steps": 12698, "loss": 0.0808, "lr": 9.502721574147567e-06, "epoch": 4.958654906284455, "percentage": 70.84, "elapsed_time": "16:01:15", "remaining_time": "6:35:43"}
1800
+ {"current_steps": 9000, "total_steps": 12698, "loss": 0.0784, "lr": 9.479332126364966e-06, "epoch": 4.961411245865491, "percentage": 70.88, "elapsed_time": "16:01:38", "remaining_time": "6:35:07"}
1801
+ {"current_steps": 9005, "total_steps": 12698, "loss": 0.0777, "lr": 9.455962555202267e-06, "epoch": 4.964167585446527, "percentage": 70.92, "elapsed_time": "16:02:41", "remaining_time": "6:34:48"}
1802
+ {"current_steps": 9010, "total_steps": 12698, "loss": 0.0708, "lr": 9.432612904811429e-06, "epoch": 4.966923925027563, "percentage": 70.96, "elapsed_time": "16:03:02", "remaining_time": "6:34:11"}
1803
+ {"current_steps": 9015, "total_steps": 12698, "loss": 0.0781, "lr": 9.409283219306773e-06, "epoch": 4.9696802646086, "percentage": 71.0, "elapsed_time": "16:03:22", "remaining_time": "6:33:34"}
1804
+ {"current_steps": 9020, "total_steps": 12698, "loss": 0.0802, "lr": 9.385973542764895e-06, "epoch": 4.972436604189636, "percentage": 71.03, "elapsed_time": "16:03:45", "remaining_time": "6:32:58"}
1805
+ {"current_steps": 9025, "total_steps": 12698, "loss": 0.0725, "lr": 9.362683919224606e-06, "epoch": 4.975192943770672, "percentage": 71.07, "elapsed_time": "16:04:07", "remaining_time": "6:32:22"}
1806
+ {"current_steps": 9030, "total_steps": 12698, "loss": 0.072, "lr": 9.339414392686816e-06, "epoch": 4.977949283351709, "percentage": 71.11, "elapsed_time": "16:04:32", "remaining_time": "6:31:47"}
1807
+ {"current_steps": 9035, "total_steps": 12698, "loss": 0.0816, "lr": 9.316165007114469e-06, "epoch": 4.980705622932746, "percentage": 71.15, "elapsed_time": "16:04:55", "remaining_time": "6:31:12"}
1808
+ {"current_steps": 9040, "total_steps": 12698, "loss": 0.068, "lr": 9.29293580643245e-06, "epoch": 4.983461962513782, "percentage": 71.19, "elapsed_time": "16:05:36", "remaining_time": "6:30:43"}
1809
+ {"current_steps": 9045, "total_steps": 12698, "loss": 0.0738, "lr": 9.269726834527524e-06, "epoch": 4.986218302094818, "percentage": 71.23, "elapsed_time": "16:06:05", "remaining_time": "6:30:10"}
1810
+ {"current_steps": 9050, "total_steps": 12698, "loss": 0.0748, "lr": 9.246538135248227e-06, "epoch": 4.9889746416758545, "percentage": 71.27, "elapsed_time": "16:06:46", "remaining_time": "6:29:41"}
1811
+ {"current_steps": 9055, "total_steps": 12698, "loss": 0.159, "lr": 9.223369752404794e-06, "epoch": 4.991730981256891, "percentage": 71.31, "elapsed_time": "16:07:50", "remaining_time": "6:29:22"}
1812
+ {"current_steps": 9060, "total_steps": 12698, "loss": 0.0737, "lr": 9.200221729769084e-06, "epoch": 4.994487320837927, "percentage": 71.35, "elapsed_time": "16:08:16", "remaining_time": "6:28:48"}
1813
+ {"current_steps": 9065, "total_steps": 12698, "loss": 0.0756, "lr": 9.17709411107448e-06, "epoch": 4.997243660418963, "percentage": 71.39, "elapsed_time": "16:08:46", "remaining_time": "6:28:15"}
1814
+ {"current_steps": 9070, "total_steps": 12698, "loss": 0.1049, "lr": 9.153986940015817e-06, "epoch": 5.0, "percentage": 71.43, "elapsed_time": "16:09:29", "remaining_time": "6:27:47"}
1815
+ {"current_steps": 9075, "total_steps": 12698, "loss": 0.1893, "lr": 9.130900260249315e-06, "epoch": 5.002756339581037, "percentage": 71.47, "elapsed_time": "16:10:42", "remaining_time": "6:27:32"}
1816
+ {"current_steps": 9080, "total_steps": 12698, "loss": 0.1812, "lr": 9.10783411539246e-06, "epoch": 5.005512679162073, "percentage": 71.51, "elapsed_time": "16:11:51", "remaining_time": "6:27:14"}
1817
+ {"current_steps": 9085, "total_steps": 12698, "loss": 0.173, "lr": 9.084788549023951e-06, "epoch": 5.00826901874311, "percentage": 71.55, "elapsed_time": "16:13:07", "remaining_time": "6:26:59"}
1818
+ {"current_steps": 9090, "total_steps": 12698, "loss": 0.1688, "lr": 9.061763604683603e-06, "epoch": 5.0110253583241455, "percentage": 71.59, "elapsed_time": "16:14:25", "remaining_time": "6:26:46"}