Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e3def204bff1027c39582461a2b78d9b8d4653d1d72079a0075bc00207649f5
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:001611a4ce0df0471d0e5b16a053688fd9ef0d69c6b355aa6f6e9ed83d43258d
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fb81590d51abedb9159cb15e744731f048a18f193d994057ba6a0e0135e4d28
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f83d36ab52187bbcf4f9256f8fafe0b15d981ab4053d449e6f5179c77f294a4d
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -500,3 +500,252 @@
|
|
500 |
{"current_steps": 500, "total_steps": 750, "loss": 0.7982, "lr": 3.019601169804216e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "7:46:11", "remaining_time": "3:53:05"}
|
501 |
{"current_steps": 501, "total_steps": 750, "loss": 0.7587, "lr": 2.9982548372155264e-06, "epoch": 2.004, "percentage": 66.8, "elapsed_time": "7:48:10", "remaining_time": "3:52:40"}
|
502 |
{"current_steps": 502, "total_steps": 750, "loss": 0.7893, "lr": 2.9769518657180953e-06, "epoch": 2.008, "percentage": 66.93, "elapsed_time": "7:49:01", "remaining_time": "3:51:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
500 |
{"current_steps": 500, "total_steps": 750, "loss": 0.7982, "lr": 3.019601169804216e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "7:46:11", "remaining_time": "3:53:05"}
|
501 |
{"current_steps": 501, "total_steps": 750, "loss": 0.7587, "lr": 2.9982548372155264e-06, "epoch": 2.004, "percentage": 66.8, "elapsed_time": "7:48:10", "remaining_time": "3:52:40"}
|
502 |
{"current_steps": 502, "total_steps": 750, "loss": 0.7893, "lr": 2.9769518657180953e-06, "epoch": 2.008, "percentage": 66.93, "elapsed_time": "7:49:01", "remaining_time": "3:51:42"}
|
503 |
+
{"current_steps": 503, "total_steps": 750, "loss": 0.782, "lr": 2.9556927167693107e-06, "epoch": 2.012, "percentage": 67.07, "elapsed_time": "7:50:04", "remaining_time": "3:50:50"}
|
504 |
+
{"current_steps": 504, "total_steps": 750, "loss": 0.7916, "lr": 2.934477850877292e-06, "epoch": 2.016, "percentage": 67.2, "elapsed_time": "7:50:58", "remaining_time": "3:49:53"}
|
505 |
+
{"current_steps": 505, "total_steps": 750, "loss": 0.7631, "lr": 2.9133077275909112e-06, "epoch": 2.02, "percentage": 67.33, "elapsed_time": "7:51:47", "remaining_time": "3:48:53"}
|
506 |
+
{"current_steps": 506, "total_steps": 750, "loss": 0.7966, "lr": 2.892182805489846e-06, "epoch": 2.024, "percentage": 67.47, "elapsed_time": "7:52:45", "remaining_time": "3:47:58"}
|
507 |
+
{"current_steps": 507, "total_steps": 750, "loss": 0.81, "lr": 2.871103542174637e-06, "epoch": 2.028, "percentage": 67.6, "elapsed_time": "7:53:39", "remaining_time": "3:47:01"}
|
508 |
+
{"current_steps": 508, "total_steps": 750, "loss": 0.7654, "lr": 2.8500703942567874e-06, "epoch": 2.032, "percentage": 67.73, "elapsed_time": "7:54:30", "remaining_time": "3:46:02"}
|
509 |
+
{"current_steps": 509, "total_steps": 750, "loss": 0.7834, "lr": 2.82908381734886e-06, "epoch": 2.036, "percentage": 67.87, "elapsed_time": "7:55:24", "remaining_time": "3:45:05"}
|
510 |
+
{"current_steps": 510, "total_steps": 750, "loss": 0.8032, "lr": 2.8081442660546126e-06, "epoch": 2.04, "percentage": 68.0, "elapsed_time": "7:56:26", "remaining_time": "3:44:12"}
|
511 |
+
{"current_steps": 511, "total_steps": 750, "loss": 0.7803, "lr": 2.7872521939591556e-06, "epoch": 2.044, "percentage": 68.13, "elapsed_time": "7:57:26", "remaining_time": "3:43:18"}
|
512 |
+
{"current_steps": 512, "total_steps": 750, "loss": 0.7928, "lr": 2.7664080536191178e-06, "epoch": 2.048, "percentage": 68.27, "elapsed_time": "7:58:20", "remaining_time": "3:42:21"}
|
513 |
+
{"current_steps": 513, "total_steps": 750, "loss": 0.7821, "lr": 2.7456122965528475e-06, "epoch": 2.052, "percentage": 68.4, "elapsed_time": "7:59:21", "remaining_time": "3:41:27"}
|
514 |
+
{"current_steps": 514, "total_steps": 750, "loss": 0.7755, "lr": 2.724865373230632e-06, "epoch": 2.056, "percentage": 68.53, "elapsed_time": "8:00:17", "remaining_time": "3:40:31"}
|
515 |
+
{"current_steps": 515, "total_steps": 750, "loss": 0.7647, "lr": 2.7041677330649408e-06, "epoch": 2.06, "percentage": 68.67, "elapsed_time": "8:01:08", "remaining_time": "3:39:33"}
|
516 |
+
{"current_steps": 516, "total_steps": 750, "loss": 0.7806, "lr": 2.683519824400693e-06, "epoch": 2.064, "percentage": 68.8, "elapsed_time": "8:02:03", "remaining_time": "3:38:36"}
|
517 |
+
{"current_steps": 517, "total_steps": 750, "loss": 0.7562, "lr": 2.662922094505529e-06, "epoch": 2.068, "percentage": 68.93, "elapsed_time": "8:02:55", "remaining_time": "3:37:38"}
|
518 |
+
{"current_steps": 518, "total_steps": 750, "loss": 0.7736, "lr": 2.6423749895601494e-06, "epoch": 2.072, "percentage": 69.07, "elapsed_time": "8:03:47", "remaining_time": "3:36:40"}
|
519 |
+
{"current_steps": 519, "total_steps": 750, "loss": 0.7694, "lr": 2.6218789546486235e-06, "epoch": 2.076, "percentage": 69.2, "elapsed_time": "8:04:46", "remaining_time": "3:35:46"}
|
520 |
+
{"current_steps": 520, "total_steps": 750, "loss": 0.7603, "lr": 2.601434433748771e-06, "epoch": 2.08, "percentage": 69.33, "elapsed_time": "8:05:44", "remaining_time": "3:34:50"}
|
521 |
+
{"current_steps": 521, "total_steps": 750, "loss": 0.8048, "lr": 2.581041869722519e-06, "epoch": 2.084, "percentage": 69.47, "elapsed_time": "8:06:44", "remaining_time": "3:33:56"}
|
522 |
+
{"current_steps": 522, "total_steps": 750, "loss": 0.754, "lr": 2.560701704306336e-06, "epoch": 2.088, "percentage": 69.6, "elapsed_time": "8:07:37", "remaining_time": "3:32:58"}
|
523 |
+
{"current_steps": 523, "total_steps": 750, "loss": 0.7941, "lr": 2.540414378101647e-06, "epoch": 2.092, "percentage": 69.73, "elapsed_time": "8:08:35", "remaining_time": "3:32:04"}
|
524 |
+
{"current_steps": 524, "total_steps": 750, "loss": 0.7982, "lr": 2.52018033056529e-06, "epoch": 2.096, "percentage": 69.87, "elapsed_time": "8:09:27", "remaining_time": "3:31:06"}
|
525 |
+
{"current_steps": 525, "total_steps": 750, "loss": 0.7704, "lr": 2.5000000000000015e-06, "epoch": 2.1, "percentage": 70.0, "elapsed_time": "8:10:22", "remaining_time": "3:30:09"}
|
526 |
+
{"current_steps": 526, "total_steps": 750, "loss": 0.7626, "lr": 2.4798738235449164e-06, "epoch": 2.104, "percentage": 70.13, "elapsed_time": "8:11:17", "remaining_time": "3:29:12"}
|
527 |
+
{"current_steps": 527, "total_steps": 750, "loss": 0.7781, "lr": 2.4598022371661113e-06, "epoch": 2.108, "percentage": 70.27, "elapsed_time": "8:12:22", "remaining_time": "3:28:20"}
|
528 |
+
{"current_steps": 528, "total_steps": 750, "loss": 0.7615, "lr": 2.4397856756471435e-06, "epoch": 2.112, "percentage": 70.4, "elapsed_time": "8:13:14", "remaining_time": "3:27:23"}
|
529 |
+
{"current_steps": 529, "total_steps": 750, "loss": 0.781, "lr": 2.4198245725796427e-06, "epoch": 2.116, "percentage": 70.53, "elapsed_time": "8:14:23", "remaining_time": "3:26:32"}
|
530 |
+
{"current_steps": 530, "total_steps": 750, "loss": 0.7935, "lr": 2.3999193603539234e-06, "epoch": 2.12, "percentage": 70.67, "elapsed_time": "8:15:26", "remaining_time": "3:25:39"}
|
531 |
+
{"current_steps": 531, "total_steps": 750, "loss": 0.7558, "lr": 2.380070470149605e-06, "epoch": 2.124, "percentage": 70.8, "elapsed_time": "8:16:14", "remaining_time": "3:24:39"}
|
532 |
+
{"current_steps": 532, "total_steps": 750, "loss": 0.7801, "lr": 2.3602783319262847e-06, "epoch": 2.128, "percentage": 70.93, "elapsed_time": "8:17:13", "remaining_time": "3:23:45"}
|
533 |
+
{"current_steps": 533, "total_steps": 750, "loss": 0.7615, "lr": 2.340543374414212e-06, "epoch": 2.132, "percentage": 71.07, "elapsed_time": "8:18:02", "remaining_time": "3:22:46"}
|
534 |
+
{"current_steps": 534, "total_steps": 750, "loss": 0.7831, "lr": 2.320866025105016e-06, "epoch": 2.136, "percentage": 71.2, "elapsed_time": "8:18:58", "remaining_time": "3:21:49"}
|
535 |
+
{"current_steps": 535, "total_steps": 750, "loss": 0.7642, "lr": 2.3012467102424373e-06, "epoch": 2.14, "percentage": 71.33, "elapsed_time": "8:19:54", "remaining_time": "3:20:53"}
|
536 |
+
{"current_steps": 536, "total_steps": 750, "loss": 0.7502, "lr": 2.2816858548130837e-06, "epoch": 2.144, "percentage": 71.47, "elapsed_time": "8:20:48", "remaining_time": "3:19:57"}
|
537 |
+
{"current_steps": 537, "total_steps": 750, "loss": 0.7878, "lr": 2.2621838825372496e-06, "epoch": 2.148, "percentage": 71.6, "elapsed_time": "8:21:44", "remaining_time": "3:19:00"}
|
538 |
+
{"current_steps": 538, "total_steps": 750, "loss": 0.8084, "lr": 2.2427412158597133e-06, "epoch": 2.152, "percentage": 71.73, "elapsed_time": "8:22:41", "remaining_time": "3:18:05"}
|
539 |
+
{"current_steps": 539, "total_steps": 750, "loss": 0.7675, "lr": 2.2233582759406065e-06, "epoch": 2.156, "percentage": 71.87, "elapsed_time": "8:23:36", "remaining_time": "3:17:08"}
|
540 |
+
{"current_steps": 540, "total_steps": 750, "loss": 0.7903, "lr": 2.204035482646267e-06, "epoch": 2.16, "percentage": 72.0, "elapsed_time": "8:24:44", "remaining_time": "3:16:17"}
|
541 |
+
{"current_steps": 541, "total_steps": 750, "loss": 0.7992, "lr": 2.184773254540169e-06, "epoch": 2.164, "percentage": 72.13, "elapsed_time": "8:25:50", "remaining_time": "3:15:24"}
|
542 |
+
{"current_steps": 542, "total_steps": 750, "loss": 0.7768, "lr": 2.165572008873845e-06, "epoch": 2.168, "percentage": 72.27, "elapsed_time": "8:26:44", "remaining_time": "3:14:27"}
|
543 |
+
{"current_steps": 543, "total_steps": 750, "loss": 0.7797, "lr": 2.146432161577842e-06, "epoch": 2.172, "percentage": 72.4, "elapsed_time": "8:27:36", "remaining_time": "3:13:30"}
|
544 |
+
{"current_steps": 544, "total_steps": 750, "loss": 0.7717, "lr": 2.12735412725272e-06, "epoch": 2.176, "percentage": 72.53, "elapsed_time": "8:28:30", "remaining_time": "3:12:33"}
|
545 |
+
{"current_steps": 545, "total_steps": 750, "loss": 0.752, "lr": 2.1083383191600676e-06, "epoch": 2.18, "percentage": 72.67, "elapsed_time": "8:29:24", "remaining_time": "3:11:36"}
|
546 |
+
{"current_steps": 546, "total_steps": 750, "loss": 0.7791, "lr": 2.0893851492135536e-06, "epoch": 2.184, "percentage": 72.8, "elapsed_time": "8:30:19", "remaining_time": "3:10:40"}
|
547 |
+
{"current_steps": 547, "total_steps": 750, "loss": 0.7951, "lr": 2.0704950279699986e-06, "epoch": 2.188, "percentage": 72.93, "elapsed_time": "8:31:15", "remaining_time": "3:09:44"}
|
548 |
+
{"current_steps": 548, "total_steps": 750, "loss": 0.7639, "lr": 2.0516683646204836e-06, "epoch": 2.192, "percentage": 73.07, "elapsed_time": "8:32:10", "remaining_time": "3:08:47"}
|
549 |
+
{"current_steps": 549, "total_steps": 750, "loss": 0.7593, "lr": 2.0329055669814936e-06, "epoch": 2.196, "percentage": 73.2, "elapsed_time": "8:33:08", "remaining_time": "3:07:52"}
|
550 |
+
{"current_steps": 550, "total_steps": 750, "loss": 0.8132, "lr": 2.0142070414860704e-06, "epoch": 2.2, "percentage": 73.33, "elapsed_time": "8:34:11", "remaining_time": "3:06:58"}
|
551 |
+
{"current_steps": 551, "total_steps": 750, "loss": 0.7773, "lr": 1.9955731931750182e-06, "epoch": 2.204, "percentage": 73.47, "elapsed_time": "8:35:16", "remaining_time": "3:06:05"}
|
552 |
+
{"current_steps": 552, "total_steps": 750, "loss": 0.7781, "lr": 1.977004425688126e-06, "epoch": 2.208, "percentage": 73.6, "elapsed_time": "8:36:06", "remaining_time": "3:05:07"}
|
553 |
+
{"current_steps": 553, "total_steps": 750, "loss": 0.8189, "lr": 1.958501141255427e-06, "epoch": 2.212, "percentage": 73.73, "elapsed_time": "8:37:03", "remaining_time": "3:04:11"}
|
554 |
+
{"current_steps": 554, "total_steps": 750, "loss": 0.7639, "lr": 1.9400637406884875e-06, "epoch": 2.216, "percentage": 73.87, "elapsed_time": "8:38:03", "remaining_time": "3:03:17"}
|
555 |
+
{"current_steps": 555, "total_steps": 750, "loss": 0.767, "lr": 1.9216926233717087e-06, "epoch": 2.22, "percentage": 74.0, "elapsed_time": "8:38:56", "remaining_time": "3:02:19"}
|
556 |
+
{"current_steps": 556, "total_steps": 750, "loss": 0.7658, "lr": 1.9033881872537009e-06, "epoch": 2.224, "percentage": 74.13, "elapsed_time": "8:39:49", "remaining_time": "3:01:22"}
|
557 |
+
{"current_steps": 557, "total_steps": 750, "loss": 0.7824, "lr": 1.88515082883864e-06, "epoch": 2.228, "percentage": 74.27, "elapsed_time": "8:40:45", "remaining_time": "3:00:26"}
|
558 |
+
{"current_steps": 558, "total_steps": 750, "loss": 0.8217, "lr": 1.8669809431776991e-06, "epoch": 2.232, "percentage": 74.4, "elapsed_time": "8:41:50", "remaining_time": "2:59:33"}
|
559 |
+
{"current_steps": 559, "total_steps": 750, "loss": 0.8179, "lr": 1.8488789238604676e-06, "epoch": 2.2359999999999998, "percentage": 74.53, "elapsed_time": "8:42:54", "remaining_time": "2:58:40"}
|
560 |
+
{"current_steps": 560, "total_steps": 750, "loss": 0.8095, "lr": 1.8308451630064484e-06, "epoch": 2.24, "percentage": 74.67, "elapsed_time": "8:43:52", "remaining_time": "2:57:44"}
|
561 |
+
{"current_steps": 561, "total_steps": 750, "loss": 0.7891, "lr": 1.8128800512565514e-06, "epoch": 2.2439999999999998, "percentage": 74.8, "elapsed_time": "8:44:48", "remaining_time": "2:56:48"}
|
562 |
+
{"current_steps": 562, "total_steps": 750, "loss": 0.805, "lr": 1.7949839777646327e-06, "epoch": 2.248, "percentage": 74.93, "elapsed_time": "8:45:51", "remaining_time": "2:55:54"}
|
563 |
+
{"current_steps": 563, "total_steps": 750, "loss": 0.7491, "lr": 1.7771573301890666e-06, "epoch": 2.252, "percentage": 75.07, "elapsed_time": "8:46:37", "remaining_time": "2:54:55"}
|
564 |
+
{"current_steps": 564, "total_steps": 750, "loss": 0.7802, "lr": 1.7594004946843458e-06, "epoch": 2.2560000000000002, "percentage": 75.2, "elapsed_time": "8:47:40", "remaining_time": "2:54:01"}
|
565 |
+
{"current_steps": 565, "total_steps": 750, "loss": 0.7608, "lr": 1.7417138558927244e-06, "epoch": 2.26, "percentage": 75.33, "elapsed_time": "8:48:25", "remaining_time": "2:53:01"}
|
566 |
+
{"current_steps": 566, "total_steps": 750, "loss": 0.7541, "lr": 1.7240977969358757e-06, "epoch": 2.2640000000000002, "percentage": 75.47, "elapsed_time": "8:49:21", "remaining_time": "2:52:05"}
|
567 |
+
{"current_steps": 567, "total_steps": 750, "loss": 0.7967, "lr": 1.7065526994065973e-06, "epoch": 2.268, "percentage": 75.6, "elapsed_time": "8:50:18", "remaining_time": "2:51:09"}
|
568 |
+
{"current_steps": 568, "total_steps": 750, "loss": 0.7817, "lr": 1.6890789433605508e-06, "epoch": 2.2720000000000002, "percentage": 75.73, "elapsed_time": "8:51:18", "remaining_time": "2:50:14"}
|
569 |
+
{"current_steps": 569, "total_steps": 750, "loss": 0.7586, "lr": 1.671676907308018e-06, "epoch": 2.276, "percentage": 75.87, "elapsed_time": "8:52:12", "remaining_time": "2:49:17"}
|
570 |
+
{"current_steps": 570, "total_steps": 750, "loss": 0.7612, "lr": 1.6543469682057105e-06, "epoch": 2.2800000000000002, "percentage": 76.0, "elapsed_time": "8:53:03", "remaining_time": "2:48:20"}
|
571 |
+
{"current_steps": 571, "total_steps": 750, "loss": 0.7828, "lr": 1.6370895014486e-06, "epoch": 2.284, "percentage": 76.13, "elapsed_time": "8:53:53", "remaining_time": "2:47:22"}
|
572 |
+
{"current_steps": 572, "total_steps": 750, "loss": 0.7579, "lr": 1.6199048808617896e-06, "epoch": 2.288, "percentage": 76.27, "elapsed_time": "8:54:39", "remaining_time": "2:46:22"}
|
573 |
+
{"current_steps": 573, "total_steps": 750, "loss": 0.7288, "lr": 1.6027934786924187e-06, "epoch": 2.292, "percentage": 76.4, "elapsed_time": "8:55:29", "remaining_time": "2:45:24"}
|
574 |
+
{"current_steps": 574, "total_steps": 750, "loss": 0.7974, "lr": 1.5857556656015837e-06, "epoch": 2.296, "percentage": 76.53, "elapsed_time": "8:56:26", "remaining_time": "2:44:28"}
|
575 |
+
{"current_steps": 575, "total_steps": 750, "loss": 0.8026, "lr": 1.5687918106563326e-06, "epoch": 2.3, "percentage": 76.67, "elapsed_time": "8:57:27", "remaining_time": "2:43:34"}
|
576 |
+
{"current_steps": 576, "total_steps": 750, "loss": 0.7705, "lr": 1.551902281321651e-06, "epoch": 2.304, "percentage": 76.8, "elapsed_time": "8:58:26", "remaining_time": "2:42:39"}
|
577 |
+
{"current_steps": 577, "total_steps": 750, "loss": 0.79, "lr": 1.5350874434525142e-06, "epoch": 2.308, "percentage": 76.93, "elapsed_time": "8:59:25", "remaining_time": "2:41:43"}
|
578 |
+
{"current_steps": 578, "total_steps": 750, "loss": 0.7796, "lr": 1.5183476612859538e-06, "epoch": 2.312, "percentage": 77.07, "elapsed_time": "9:00:20", "remaining_time": "2:40:47"}
|
579 |
+
{"current_steps": 579, "total_steps": 750, "loss": 0.7863, "lr": 1.5016832974331725e-06, "epoch": 2.316, "percentage": 77.2, "elapsed_time": "9:01:17", "remaining_time": "2:39:51"}
|
580 |
+
{"current_steps": 580, "total_steps": 750, "loss": 0.7793, "lr": 1.4850947128716914e-06, "epoch": 2.32, "percentage": 77.33, "elapsed_time": "9:02:12", "remaining_time": "2:38:55"}
|
581 |
+
{"current_steps": 581, "total_steps": 750, "loss": 0.7962, "lr": 1.4685822669375239e-06, "epoch": 2.324, "percentage": 77.47, "elapsed_time": "9:03:14", "remaining_time": "2:38:00"}
|
582 |
+
{"current_steps": 582, "total_steps": 750, "loss": 0.7752, "lr": 1.4521463173173966e-06, "epoch": 2.328, "percentage": 77.6, "elapsed_time": "9:04:13", "remaining_time": "2:37:05"}
|
583 |
+
{"current_steps": 583, "total_steps": 750, "loss": 0.7563, "lr": 1.4357872200409988e-06, "epoch": 2.332, "percentage": 77.73, "elapsed_time": "9:05:08", "remaining_time": "2:36:09"}
|
584 |
+
{"current_steps": 584, "total_steps": 750, "loss": 0.7666, "lr": 1.4195053294732757e-06, "epoch": 2.336, "percentage": 77.87, "elapsed_time": "9:05:50", "remaining_time": "2:35:09"}
|
585 |
+
{"current_steps": 585, "total_steps": 750, "loss": 0.8055, "lr": 1.4033009983067454e-06, "epoch": 2.34, "percentage": 78.0, "elapsed_time": "9:06:46", "remaining_time": "2:34:12"}
|
586 |
+
{"current_steps": 586, "total_steps": 750, "loss": 0.7531, "lr": 1.3871745775538598e-06, "epoch": 2.344, "percentage": 78.13, "elapsed_time": "9:07:45", "remaining_time": "2:33:17"}
|
587 |
+
{"current_steps": 587, "total_steps": 750, "loss": 0.7978, "lr": 1.371126416539409e-06, "epoch": 2.348, "percentage": 78.27, "elapsed_time": "9:08:50", "remaining_time": "2:32:24"}
|
588 |
+
{"current_steps": 588, "total_steps": 750, "loss": 0.7487, "lr": 1.3551568628929434e-06, "epoch": 2.352, "percentage": 78.4, "elapsed_time": "9:09:46", "remaining_time": "2:31:28"}
|
589 |
+
{"current_steps": 589, "total_steps": 750, "loss": 0.7962, "lr": 1.339266262541249e-06, "epoch": 2.356, "percentage": 78.53, "elapsed_time": "9:10:44", "remaining_time": "2:30:32"}
|
590 |
+
{"current_steps": 590, "total_steps": 750, "loss": 0.7901, "lr": 1.3234549597008572e-06, "epoch": 2.36, "percentage": 78.67, "elapsed_time": "9:11:41", "remaining_time": "2:29:36"}
|
591 |
+
{"current_steps": 591, "total_steps": 750, "loss": 0.7982, "lr": 1.3077232968705805e-06, "epoch": 2.364, "percentage": 78.8, "elapsed_time": "9:12:38", "remaining_time": "2:28:40"}
|
592 |
+
{"current_steps": 592, "total_steps": 750, "loss": 0.7654, "lr": 1.2920716148241036e-06, "epoch": 2.368, "percentage": 78.93, "elapsed_time": "9:13:38", "remaining_time": "2:27:45"}
|
593 |
+
{"current_steps": 593, "total_steps": 750, "loss": 0.7895, "lr": 1.2765002526025871e-06, "epoch": 2.372, "percentage": 79.07, "elapsed_time": "9:14:35", "remaining_time": "2:26:49"}
|
594 |
+
{"current_steps": 594, "total_steps": 750, "loss": 0.7466, "lr": 1.2610095475073415e-06, "epoch": 2.376, "percentage": 79.2, "elapsed_time": "9:15:30", "remaining_time": "2:25:53"}
|
595 |
+
{"current_steps": 595, "total_steps": 750, "loss": 0.7965, "lr": 1.2455998350925042e-06, "epoch": 2.38, "percentage": 79.33, "elapsed_time": "9:16:32", "remaining_time": "2:24:58"}
|
596 |
+
{"current_steps": 596, "total_steps": 750, "loss": 0.7675, "lr": 1.2302714491577834e-06, "epoch": 2.384, "percentage": 79.47, "elapsed_time": "9:17:29", "remaining_time": "2:24:03"}
|
597 |
+
{"current_steps": 597, "total_steps": 750, "loss": 0.7693, "lr": 1.2150247217412186e-06, "epoch": 2.388, "percentage": 79.6, "elapsed_time": "9:18:16", "remaining_time": "2:23:04"}
|
598 |
+
{"current_steps": 598, "total_steps": 750, "loss": 0.7664, "lr": 1.1998599831119912e-06, "epoch": 2.392, "percentage": 79.73, "elapsed_time": "9:19:19", "remaining_time": "2:22:10"}
|
599 |
+
{"current_steps": 599, "total_steps": 750, "loss": 0.7766, "lr": 1.1847775617632746e-06, "epoch": 2.396, "percentage": 79.87, "elapsed_time": "9:20:18", "remaining_time": "2:21:14"}
|
600 |
+
{"current_steps": 600, "total_steps": 750, "loss": 0.779, "lr": 1.1697777844051105e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "9:21:19", "remaining_time": "2:20:19"}
|
601 |
+
{"current_steps": 601, "total_steps": 750, "loss": 0.7929, "lr": 1.1548609759573375e-06, "epoch": 2.404, "percentage": 80.13, "elapsed_time": "9:22:20", "remaining_time": "2:19:24"}
|
602 |
+
{"current_steps": 602, "total_steps": 750, "loss": 0.7581, "lr": 1.1400274595425499e-06, "epoch": 2.408, "percentage": 80.27, "elapsed_time": "9:23:13", "remaining_time": "2:18:28"}
|
603 |
+
{"current_steps": 603, "total_steps": 750, "loss": 0.7649, "lr": 1.1252775564791023e-06, "epoch": 2.412, "percentage": 80.4, "elapsed_time": "9:24:05", "remaining_time": "2:17:30"}
|
604 |
+
{"current_steps": 604, "total_steps": 750, "loss": 0.7938, "lr": 1.1106115862741457e-06, "epoch": 2.416, "percentage": 80.53, "elapsed_time": "9:25:07", "remaining_time": "2:16:36"}
|
605 |
+
{"current_steps": 605, "total_steps": 750, "loss": 0.7637, "lr": 1.096029866616704e-06, "epoch": 2.42, "percentage": 80.67, "elapsed_time": "9:26:08", "remaining_time": "2:15:41"}
|
606 |
+
{"current_steps": 606, "total_steps": 750, "loss": 0.7722, "lr": 1.0815327133708015e-06, "epoch": 2.424, "percentage": 80.8, "elapsed_time": "9:26:57", "remaining_time": "2:14:43"}
|
607 |
+
{"current_steps": 607, "total_steps": 750, "loss": 0.7867, "lr": 1.0671204405686108e-06, "epoch": 2.428, "percentage": 80.93, "elapsed_time": "9:27:51", "remaining_time": "2:13:46"}
|
608 |
+
{"current_steps": 608, "total_steps": 750, "loss": 0.8015, "lr": 1.052793360403655e-06, "epoch": 2.432, "percentage": 81.07, "elapsed_time": "9:28:50", "remaining_time": "2:12:51"}
|
609 |
+
{"current_steps": 609, "total_steps": 750, "loss": 0.7635, "lr": 1.0385517832240472e-06, "epoch": 2.436, "percentage": 81.2, "elapsed_time": "9:29:47", "remaining_time": "2:11:55"}
|
610 |
+
{"current_steps": 610, "total_steps": 750, "loss": 0.8132, "lr": 1.0243960175257605e-06, "epoch": 2.44, "percentage": 81.33, "elapsed_time": "9:30:43", "remaining_time": "2:10:59"}
|
611 |
+
{"current_steps": 611, "total_steps": 750, "loss": 0.7571, "lr": 1.010326369945957e-06, "epoch": 2.444, "percentage": 81.47, "elapsed_time": "9:31:33", "remaining_time": "2:10:01"}
|
612 |
+
{"current_steps": 612, "total_steps": 750, "loss": 0.7628, "lr": 9.963431452563331e-07, "epoch": 2.448, "percentage": 81.6, "elapsed_time": "9:32:20", "remaining_time": "2:09:03"}
|
613 |
+
{"current_steps": 613, "total_steps": 750, "loss": 0.787, "lr": 9.824466463565246e-07, "epoch": 2.452, "percentage": 81.73, "elapsed_time": "9:33:16", "remaining_time": "2:08:07"}
|
614 |
+
{"current_steps": 614, "total_steps": 750, "loss": 0.7998, "lr": 9.686371742675443e-07, "epoch": 2.456, "percentage": 81.87, "elapsed_time": "9:34:04", "remaining_time": "2:07:09"}
|
615 |
+
{"current_steps": 615, "total_steps": 750, "loss": 0.7981, "lr": 9.549150281252633e-07, "epoch": 2.46, "percentage": 82.0, "elapsed_time": "9:34:55", "remaining_time": "2:06:12"}
|
616 |
+
{"current_steps": 616, "total_steps": 750, "loss": 0.7642, "lr": 9.412805051739266e-07, "epoch": 2.464, "percentage": 82.13, "elapsed_time": "9:35:51", "remaining_time": "2:05:16"}
|
617 |
+
{"current_steps": 617, "total_steps": 750, "loss": 0.784, "lr": 9.277339007597158e-07, "epoch": 2.468, "percentage": 82.27, "elapsed_time": "9:36:45", "remaining_time": "2:04:19"}
|
618 |
+
{"current_steps": 618, "total_steps": 750, "loss": 0.7681, "lr": 9.142755083243577e-07, "epoch": 2.472, "percentage": 82.4, "elapsed_time": "9:37:44", "remaining_time": "2:03:24"}
|
619 |
+
{"current_steps": 619, "total_steps": 750, "loss": 0.7979, "lr": 9.009056193987569e-07, "epoch": 2.476, "percentage": 82.53, "elapsed_time": "9:38:54", "remaining_time": "2:02:30"}
|
620 |
+
{"current_steps": 620, "total_steps": 750, "loss": 0.7802, "lr": 8.876245235966884e-07, "epoch": 2.48, "percentage": 82.67, "elapsed_time": "9:39:58", "remaining_time": "2:01:36"}
|
621 |
+
{"current_steps": 621, "total_steps": 750, "loss": 0.7582, "lr": 8.744325086085248e-07, "epoch": 2.484, "percentage": 82.8, "elapsed_time": "9:40:53", "remaining_time": "2:00:39"}
|
622 |
+
{"current_steps": 622, "total_steps": 750, "loss": 0.7943, "lr": 8.613298601949971e-07, "epoch": 2.488, "percentage": 82.93, "elapsed_time": "9:41:48", "remaining_time": "1:59:43"}
|
623 |
+
{"current_steps": 623, "total_steps": 750, "loss": 0.799, "lr": 8.483168621810133e-07, "epoch": 2.492, "percentage": 83.07, "elapsed_time": "9:42:49", "remaining_time": "1:58:48"}
|
624 |
+
{"current_steps": 624, "total_steps": 750, "loss": 0.747, "lr": 8.353937964495029e-07, "epoch": 2.496, "percentage": 83.2, "elapsed_time": "9:43:38", "remaining_time": "1:57:51"}
|
625 |
+
{"current_steps": 625, "total_steps": 750, "loss": 0.772, "lr": 8.225609429353187e-07, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "9:44:24", "remaining_time": "1:56:52"}
|
626 |
+
{"current_steps": 626, "total_steps": 750, "loss": 0.7802, "lr": 8.098185796191632e-07, "epoch": 2.504, "percentage": 83.47, "elapsed_time": "9:45:12", "remaining_time": "1:55:55"}
|
627 |
+
{"current_steps": 627, "total_steps": 750, "loss": 0.7883, "lr": 7.971669825215789e-07, "epoch": 2.508, "percentage": 83.6, "elapsed_time": "9:46:05", "remaining_time": "1:54:58"}
|
628 |
+
{"current_steps": 628, "total_steps": 750, "loss": 0.7879, "lr": 7.846064256969571e-07, "epoch": 2.512, "percentage": 83.73, "elapsed_time": "9:46:57", "remaining_time": "1:54:01"}
|
629 |
+
{"current_steps": 629, "total_steps": 750, "loss": 0.797, "lr": 7.72137181227608e-07, "epoch": 2.516, "percentage": 83.87, "elapsed_time": "9:47:54", "remaining_time": "1:53:05"}
|
630 |
+
{"current_steps": 630, "total_steps": 750, "loss": 0.7693, "lr": 7.597595192178702e-07, "epoch": 2.52, "percentage": 84.0, "elapsed_time": "9:48:49", "remaining_time": "1:52:09"}
|
631 |
+
{"current_steps": 631, "total_steps": 750, "loss": 0.7791, "lr": 7.47473707788251e-07, "epoch": 2.524, "percentage": 84.13, "elapsed_time": "9:49:51", "remaining_time": "1:51:14"}
|
632 |
+
{"current_steps": 632, "total_steps": 750, "loss": 0.7548, "lr": 7.352800130696253e-07, "epoch": 2.528, "percentage": 84.27, "elapsed_time": "9:50:39", "remaining_time": "1:50:16"}
|
633 |
+
{"current_steps": 633, "total_steps": 750, "loss": 0.7598, "lr": 7.23178699197467e-07, "epoch": 2.532, "percentage": 84.4, "elapsed_time": "9:51:26", "remaining_time": "1:49:19"}
|
634 |
+
{"current_steps": 634, "total_steps": 750, "loss": 0.781, "lr": 7.111700283061318e-07, "epoch": 2.536, "percentage": 84.53, "elapsed_time": "9:52:22", "remaining_time": "1:48:23"}
|
635 |
+
{"current_steps": 635, "total_steps": 750, "loss": 0.7823, "lr": 6.992542605231739e-07, "epoch": 2.54, "percentage": 84.67, "elapsed_time": "9:53:11", "remaining_time": "1:47:25"}
|
636 |
+
{"current_steps": 636, "total_steps": 750, "loss": 0.7728, "lr": 6.874316539637127e-07, "epoch": 2.544, "percentage": 84.8, "elapsed_time": "9:54:02", "remaining_time": "1:46:28"}
|
637 |
+
{"current_steps": 637, "total_steps": 750, "loss": 0.8157, "lr": 6.757024647248456e-07, "epoch": 2.548, "percentage": 84.93, "elapsed_time": "9:55:07", "remaining_time": "1:45:34"}
|
638 |
+
{"current_steps": 638, "total_steps": 750, "loss": 0.7474, "lr": 6.640669468800947e-07, "epoch": 2.552, "percentage": 85.07, "elapsed_time": "9:56:02", "remaining_time": "1:44:38"}
|
639 |
+
{"current_steps": 639, "total_steps": 750, "loss": 0.7731, "lr": 6.52525352473905e-07, "epoch": 2.556, "percentage": 85.2, "elapsed_time": "9:57:00", "remaining_time": "1:43:42"}
|
640 |
+
{"current_steps": 640, "total_steps": 750, "loss": 0.75, "lr": 6.410779315161885e-07, "epoch": 2.56, "percentage": 85.33, "elapsed_time": "9:57:49", "remaining_time": "1:42:45"}
|
641 |
+
{"current_steps": 641, "total_steps": 750, "loss": 0.755, "lr": 6.297249319769016e-07, "epoch": 2.564, "percentage": 85.47, "elapsed_time": "9:58:40", "remaining_time": "1:41:48"}
|
642 |
+
{"current_steps": 642, "total_steps": 750, "loss": 0.7378, "lr": 6.184665997806832e-07, "epoch": 2.568, "percentage": 85.6, "elapsed_time": "9:59:28", "remaining_time": "1:40:50"}
|
643 |
+
{"current_steps": 643, "total_steps": 750, "loss": 0.7588, "lr": 6.073031788015133e-07, "epoch": 2.572, "percentage": 85.73, "elapsed_time": "10:00:23", "remaining_time": "1:39:54"}
|
644 |
+
{"current_steps": 644, "total_steps": 750, "loss": 0.7837, "lr": 5.962349108574478e-07, "epoch": 2.576, "percentage": 85.87, "elapsed_time": "10:01:20", "remaining_time": "1:38:58"}
|
645 |
+
{"current_steps": 645, "total_steps": 750, "loss": 0.7922, "lr": 5.852620357053651e-07, "epoch": 2.58, "percentage": 86.0, "elapsed_time": "10:02:16", "remaining_time": "1:38:02"}
|
646 |
+
{"current_steps": 646, "total_steps": 750, "loss": 0.7545, "lr": 5.743847910357836e-07, "epoch": 2.584, "percentage": 86.13, "elapsed_time": "10:03:06", "remaining_time": "1:37:05"}
|
647 |
+
{"current_steps": 647, "total_steps": 750, "loss": 0.8032, "lr": 5.636034124677043e-07, "epoch": 2.588, "percentage": 86.27, "elapsed_time": "10:04:04", "remaining_time": "1:36:10"}
|
648 |
+
{"current_steps": 648, "total_steps": 750, "loss": 0.781, "lr": 5.529181335435124e-07, "epoch": 2.592, "percentage": 86.4, "elapsed_time": "10:04:52", "remaining_time": "1:35:12"}
|
649 |
+
{"current_steps": 649, "total_steps": 750, "loss": 0.7701, "lr": 5.423291857239177e-07, "epoch": 2.596, "percentage": 86.53, "elapsed_time": "10:05:52", "remaining_time": "1:34:17"}
|
650 |
+
{"current_steps": 650, "total_steps": 750, "loss": 0.7526, "lr": 5.318367983829393e-07, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "10:06:49", "remaining_time": "1:33:21"}
|
651 |
+
{"current_steps": 651, "total_steps": 750, "loss": 0.7531, "lr": 5.214411988029355e-07, "epoch": 2.604, "percentage": 86.8, "elapsed_time": "10:07:47", "remaining_time": "1:32:25"}
|
652 |
+
{"current_steps": 652, "total_steps": 750, "loss": 0.7993, "lr": 5.111426121696866e-07, "epoch": 2.608, "percentage": 86.93, "elapsed_time": "10:08:43", "remaining_time": "1:31:29"}
|
653 |
+
{"current_steps": 653, "total_steps": 750, "loss": 0.8017, "lr": 5.009412615675102e-07, "epoch": 2.612, "percentage": 87.07, "elapsed_time": "10:09:40", "remaining_time": "1:30:33"}
|
654 |
+
{"current_steps": 654, "total_steps": 750, "loss": 0.7407, "lr": 4.908373679744316e-07, "epoch": 2.616, "percentage": 87.2, "elapsed_time": "10:10:41", "remaining_time": "1:29:38"}
|
655 |
+
{"current_steps": 655, "total_steps": 750, "loss": 0.8001, "lr": 4.808311502573976e-07, "epoch": 2.62, "percentage": 87.33, "elapsed_time": "10:11:42", "remaining_time": "1:28:43"}
|
656 |
+
{"current_steps": 656, "total_steps": 750, "loss": 0.8007, "lr": 4.709228251675357e-07, "epoch": 2.624, "percentage": 87.47, "elapsed_time": "10:12:31", "remaining_time": "1:27:46"}
|
657 |
+
{"current_steps": 657, "total_steps": 750, "loss": 0.8044, "lr": 4.6111260733545714e-07, "epoch": 2.628, "percentage": 87.6, "elapsed_time": "10:13:26", "remaining_time": "1:26:50"}
|
658 |
+
{"current_steps": 658, "total_steps": 750, "loss": 0.7936, "lr": 4.514007092666084e-07, "epoch": 2.632, "percentage": 87.73, "elapsed_time": "10:14:26", "remaining_time": "1:25:54"}
|
659 |
+
{"current_steps": 659, "total_steps": 750, "loss": 0.7905, "lr": 4.417873413366702e-07, "epoch": 2.636, "percentage": 87.87, "elapsed_time": "10:15:24", "remaining_time": "1:24:58"}
|
660 |
+
{"current_steps": 660, "total_steps": 750, "loss": 0.781, "lr": 4.322727117869951e-07, "epoch": 2.64, "percentage": 88.0, "elapsed_time": "10:16:23", "remaining_time": "1:24:03"}
|
661 |
+
{"current_steps": 661, "total_steps": 750, "loss": 0.822, "lr": 4.228570267201049e-07, "epoch": 2.644, "percentage": 88.13, "elapsed_time": "10:17:14", "remaining_time": "1:23:06"}
|
662 |
+
{"current_steps": 662, "total_steps": 750, "loss": 0.7982, "lr": 4.1354049009521504e-07, "epoch": 2.648, "percentage": 88.27, "elapsed_time": "10:18:10", "remaining_time": "1:22:10"}
|
663 |
+
{"current_steps": 663, "total_steps": 750, "loss": 0.7581, "lr": 4.043233037238281e-07, "epoch": 2.652, "percentage": 88.4, "elapsed_time": "10:18:56", "remaining_time": "1:21:13"}
|
664 |
+
{"current_steps": 664, "total_steps": 750, "loss": 0.8131, "lr": 3.9520566726535367e-07, "epoch": 2.656, "percentage": 88.53, "elapsed_time": "10:19:55", "remaining_time": "1:20:17"}
|
665 |
+
{"current_steps": 665, "total_steps": 750, "loss": 0.7423, "lr": 3.8618777822278854e-07, "epoch": 2.66, "percentage": 88.67, "elapsed_time": "10:20:53", "remaining_time": "1:19:21"}
|
666 |
+
{"current_steps": 666, "total_steps": 750, "loss": 0.727, "lr": 3.772698319384349e-07, "epoch": 2.664, "percentage": 88.8, "elapsed_time": "10:21:44", "remaining_time": "1:18:25"}
|
667 |
+
{"current_steps": 667, "total_steps": 750, "loss": 0.7862, "lr": 3.684520215896703e-07, "epoch": 2.668, "percentage": 88.93, "elapsed_time": "10:22:46", "remaining_time": "1:17:29"}
|
668 |
+
{"current_steps": 668, "total_steps": 750, "loss": 0.7574, "lr": 3.597345381847656e-07, "epoch": 2.672, "percentage": 89.07, "elapsed_time": "10:23:43", "remaining_time": "1:16:33"}
|
669 |
+
{"current_steps": 669, "total_steps": 750, "loss": 0.7754, "lr": 3.511175705587433e-07, "epoch": 2.676, "percentage": 89.2, "elapsed_time": "10:24:34", "remaining_time": "1:15:37"}
|
670 |
+
{"current_steps": 670, "total_steps": 750, "loss": 0.7575, "lr": 3.426013053692878e-07, "epoch": 2.68, "percentage": 89.33, "elapsed_time": "10:25:43", "remaining_time": "1:14:42"}
|
671 |
+
{"current_steps": 671, "total_steps": 750, "loss": 0.7761, "lr": 3.341859270927067e-07, "epoch": 2.684, "percentage": 89.47, "elapsed_time": "10:26:37", "remaining_time": "1:13:46"}
|
672 |
+
{"current_steps": 672, "total_steps": 750, "loss": 0.7723, "lr": 3.258716180199278e-07, "epoch": 2.6879999999999997, "percentage": 89.6, "elapsed_time": "10:27:34", "remaining_time": "1:12:50"}
|
673 |
+
{"current_steps": 673, "total_steps": 750, "loss": 0.7849, "lr": 3.1765855825255543e-07, "epoch": 2.692, "percentage": 89.73, "elapsed_time": "10:28:34", "remaining_time": "1:11:55"}
|
674 |
+
{"current_steps": 674, "total_steps": 750, "loss": 0.7825, "lr": 3.0954692569896585e-07, "epoch": 2.6959999999999997, "percentage": 89.87, "elapsed_time": "10:29:39", "remaining_time": "1:10:59"}
|
675 |
+
{"current_steps": 675, "total_steps": 750, "loss": 0.7791, "lr": 3.015368960704584e-07, "epoch": 2.7, "percentage": 90.0, "elapsed_time": "10:30:42", "remaining_time": "1:10:04"}
|
676 |
+
{"current_steps": 676, "total_steps": 750, "loss": 0.7682, "lr": 2.9362864287744266e-07, "epoch": 2.7039999999999997, "percentage": 90.13, "elapsed_time": "10:31:30", "remaining_time": "1:09:07"}
|
677 |
+
{"current_steps": 677, "total_steps": 750, "loss": 0.7816, "lr": 2.858223374256841e-07, "epoch": 2.708, "percentage": 90.27, "elapsed_time": "10:32:28", "remaining_time": "1:08:11"}
|
678 |
+
{"current_steps": 678, "total_steps": 750, "loss": 0.7645, "lr": 2.7811814881259503e-07, "epoch": 2.7119999999999997, "percentage": 90.4, "elapsed_time": "10:33:20", "remaining_time": "1:07:15"}
|
679 |
+
{"current_steps": 679, "total_steps": 750, "loss": 0.7793, "lr": 2.705162439235648e-07, "epoch": 2.716, "percentage": 90.53, "elapsed_time": "10:34:21", "remaining_time": "1:06:19"}
|
680 |
+
{"current_steps": 680, "total_steps": 750, "loss": 0.7777, "lr": 2.63016787428354e-07, "epoch": 2.7199999999999998, "percentage": 90.67, "elapsed_time": "10:35:20", "remaining_time": "1:05:24"}
|
681 |
+
{"current_steps": 681, "total_steps": 750, "loss": 0.8064, "lr": 2.556199417775174e-07, "epoch": 2.724, "percentage": 90.8, "elapsed_time": "10:36:11", "remaining_time": "1:04:27"}
|
682 |
+
{"current_steps": 682, "total_steps": 750, "loss": 0.7664, "lr": 2.483258671988942e-07, "epoch": 2.7279999999999998, "percentage": 90.93, "elapsed_time": "10:37:12", "remaining_time": "1:03:32"}
|
683 |
+
{"current_steps": 683, "total_steps": 750, "loss": 0.768, "lr": 2.4113472169413176e-07, "epoch": 2.732, "percentage": 91.07, "elapsed_time": "10:38:10", "remaining_time": "1:02:36"}
|
684 |
+
{"current_steps": 684, "total_steps": 750, "loss": 0.7609, "lr": 2.3404666103526542e-07, "epoch": 2.7359999999999998, "percentage": 91.2, "elapsed_time": "10:39:18", "remaining_time": "1:01:41"}
|
685 |
+
{"current_steps": 685, "total_steps": 750, "loss": 0.8086, "lr": 2.2706183876134047e-07, "epoch": 2.74, "percentage": 91.33, "elapsed_time": "10:40:19", "remaining_time": "1:00:45"}
|
686 |
+
{"current_steps": 686, "total_steps": 750, "loss": 0.8176, "lr": 2.2018040617509174e-07, "epoch": 2.7439999999999998, "percentage": 91.47, "elapsed_time": "10:41:16", "remaining_time": "0:59:49"}
|
687 |
+
{"current_steps": 687, "total_steps": 750, "loss": 0.7824, "lr": 2.134025123396638e-07, "epoch": 2.748, "percentage": 91.6, "elapsed_time": "10:42:08", "remaining_time": "0:58:53"}
|
688 |
+
{"current_steps": 688, "total_steps": 750, "loss": 0.775, "lr": 2.0672830407537925e-07, "epoch": 2.752, "percentage": 91.73, "elapsed_time": "10:43:00", "remaining_time": "0:57:56"}
|
689 |
+
{"current_steps": 689, "total_steps": 750, "loss": 0.8086, "lr": 2.0015792595656225e-07, "epoch": 2.7560000000000002, "percentage": 91.87, "elapsed_time": "10:43:52", "remaining_time": "0:57:00"}
|
690 |
+
{"current_steps": 690, "total_steps": 750, "loss": 0.7897, "lr": 1.9369152030840553e-07, "epoch": 2.76, "percentage": 92.0, "elapsed_time": "10:44:48", "remaining_time": "0:56:04"}
|
691 |
+
{"current_steps": 691, "total_steps": 750, "loss": 0.7258, "lr": 1.873292272038868e-07, "epoch": 2.7640000000000002, "percentage": 92.13, "elapsed_time": "10:45:35", "remaining_time": "0:55:07"}
|
692 |
+
{"current_steps": 692, "total_steps": 750, "loss": 0.7727, "lr": 1.8107118446073492e-07, "epoch": 2.768, "percentage": 92.27, "elapsed_time": "10:46:21", "remaining_time": "0:54:10"}
|
693 |
+
{"current_steps": 693, "total_steps": 750, "loss": 0.7364, "lr": 1.7491752763844294e-07, "epoch": 2.7720000000000002, "percentage": 92.4, "elapsed_time": "10:47:07", "remaining_time": "0:53:13"}
|
694 |
+
{"current_steps": 694, "total_steps": 750, "loss": 0.769, "lr": 1.688683900353366e-07, "epoch": 2.776, "percentage": 92.53, "elapsed_time": "10:48:04", "remaining_time": "0:52:17"}
|
695 |
+
{"current_steps": 695, "total_steps": 750, "loss": 0.8167, "lr": 1.6292390268568103e-07, "epoch": 2.7800000000000002, "percentage": 92.67, "elapsed_time": "10:49:02", "remaining_time": "0:51:21"}
|
696 |
+
{"current_steps": 696, "total_steps": 750, "loss": 0.7854, "lr": 1.5708419435684463e-07, "epoch": 2.784, "percentage": 92.8, "elapsed_time": "10:49:59", "remaining_time": "0:50:25"}
|
697 |
+
{"current_steps": 697, "total_steps": 750, "loss": 0.7785, "lr": 1.5134939154651196e-07, "epoch": 2.7880000000000003, "percentage": 92.93, "elapsed_time": "10:50:46", "remaining_time": "0:49:29"}
|
698 |
+
{"current_steps": 698, "total_steps": 750, "loss": 0.782, "lr": 1.4571961847993977e-07, "epoch": 2.792, "percentage": 93.07, "elapsed_time": "10:51:44", "remaining_time": "0:48:33"}
|
699 |
+
{"current_steps": 699, "total_steps": 750, "loss": 0.776, "lr": 1.4019499710726913e-07, "epoch": 2.7960000000000003, "percentage": 93.2, "elapsed_time": "10:52:40", "remaining_time": "0:47:37"}
|
700 |
+
{"current_steps": 700, "total_steps": 750, "loss": 0.7813, "lr": 1.3477564710088097e-07, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "10:53:33", "remaining_time": "0:46:40"}
|
701 |
+
{"current_steps": 701, "total_steps": 750, "loss": 0.7608, "lr": 1.294616858528064e-07, "epoch": 2.8040000000000003, "percentage": 93.47, "elapsed_time": "10:54:28", "remaining_time": "0:45:44"}
|
702 |
+
{"current_steps": 702, "total_steps": 750, "loss": 0.7679, "lr": 1.2425322847218368e-07, "epoch": 2.808, "percentage": 93.6, "elapsed_time": "10:55:16", "remaining_time": "0:44:48"}
|
703 |
+
{"current_steps": 703, "total_steps": 750, "loss": 0.7511, "lr": 1.1915038778276212e-07, "epoch": 2.8120000000000003, "percentage": 93.73, "elapsed_time": "10:56:02", "remaining_time": "0:43:51"}
|
704 |
+
{"current_steps": 704, "total_steps": 750, "loss": 0.7406, "lr": 1.1415327432046041e-07, "epoch": 2.816, "percentage": 93.87, "elapsed_time": "10:57:05", "remaining_time": "0:42:56"}
|
705 |
+
{"current_steps": 705, "total_steps": 750, "loss": 0.8138, "lr": 1.0926199633097156e-07, "epoch": 2.82, "percentage": 94.0, "elapsed_time": "10:58:15", "remaining_time": "0:42:00"}
|
706 |
+
{"current_steps": 706, "total_steps": 750, "loss": 0.7478, "lr": 1.044766597674196e-07, "epoch": 2.824, "percentage": 94.13, "elapsed_time": "10:59:09", "remaining_time": "0:41:04"}
|
707 |
+
{"current_steps": 707, "total_steps": 750, "loss": 0.7825, "lr": 9.979736828806096e-08, "epoch": 2.828, "percentage": 94.27, "elapsed_time": "11:00:06", "remaining_time": "0:40:08"}
|
708 |
+
{"current_steps": 708, "total_steps": 750, "loss": 0.8049, "lr": 9.522422325404234e-08, "epoch": 2.832, "percentage": 94.4, "elapsed_time": "11:01:10", "remaining_time": "0:39:13"}
|
709 |
+
{"current_steps": 709, "total_steps": 750, "loss": 0.7697, "lr": 9.075732372720414e-08, "epoch": 2.836, "percentage": 94.53, "elapsed_time": "11:02:07", "remaining_time": "0:38:17"}
|
710 |
+
{"current_steps": 710, "total_steps": 750, "loss": 0.7875, "lr": 8.639676646793382e-08, "epoch": 2.84, "percentage": 94.67, "elapsed_time": "11:03:08", "remaining_time": "0:37:21"}
|
711 |
+
{"current_steps": 711, "total_steps": 750, "loss": 0.7587, "lr": 8.214264593307097e-08, "epoch": 2.844, "percentage": 94.8, "elapsed_time": "11:03:59", "remaining_time": "0:36:25"}
|
712 |
+
{"current_steps": 712, "total_steps": 750, "loss": 0.7964, "lr": 7.799505427386001e-08, "epoch": 2.848, "percentage": 94.93, "elapsed_time": "11:05:00", "remaining_time": "0:35:29"}
|
713 |
+
{"current_steps": 713, "total_steps": 750, "loss": 0.7781, "lr": 7.395408133395509e-08, "epoch": 2.852, "percentage": 95.07, "elapsed_time": "11:06:00", "remaining_time": "0:34:33"}
|
714 |
+
{"current_steps": 714, "total_steps": 750, "loss": 0.7413, "lr": 7.001981464747565e-08, "epoch": 2.856, "percentage": 95.2, "elapsed_time": "11:06:43", "remaining_time": "0:33:36"}
|
715 |
+
{"current_steps": 715, "total_steps": 750, "loss": 0.7592, "lr": 6.61923394371039e-08, "epoch": 2.86, "percentage": 95.33, "elapsed_time": "11:07:37", "remaining_time": "0:32:40"}
|
716 |
+
{"current_steps": 716, "total_steps": 750, "loss": 0.7833, "lr": 6.247173861224753e-08, "epoch": 2.864, "percentage": 95.47, "elapsed_time": "11:08:37", "remaining_time": "0:31:45"}
|
717 |
+
{"current_steps": 717, "total_steps": 750, "loss": 0.8241, "lr": 5.8858092767236084e-08, "epoch": 2.868, "percentage": 95.6, "elapsed_time": "11:09:40", "remaining_time": "0:30:49"}
|
718 |
+
{"current_steps": 718, "total_steps": 750, "loss": 0.775, "lr": 5.535148017958014e-08, "epoch": 2.872, "percentage": 95.73, "elapsed_time": "11:10:33", "remaining_time": "0:29:53"}
|
719 |
+
{"current_steps": 719, "total_steps": 750, "loss": 0.7998, "lr": 5.19519768082738e-08, "epoch": 2.876, "percentage": 95.87, "elapsed_time": "11:11:34", "remaining_time": "0:28:57"}
|
720 |
+
{"current_steps": 720, "total_steps": 750, "loss": 0.728, "lr": 4.865965629214819e-08, "epoch": 2.88, "percentage": 96.0, "elapsed_time": "11:12:27", "remaining_time": "0:28:01"}
|
721 |
+
{"current_steps": 721, "total_steps": 750, "loss": 0.7968, "lr": 4.5474589948280026e-08, "epoch": 2.884, "percentage": 96.13, "elapsed_time": "11:13:32", "remaining_time": "0:27:05"}
|
722 |
+
{"current_steps": 722, "total_steps": 750, "loss": 0.798, "lr": 4.2396846770441644e-08, "epoch": 2.888, "percentage": 96.27, "elapsed_time": "11:14:30", "remaining_time": "0:26:09"}
|
723 |
+
{"current_steps": 723, "total_steps": 750, "loss": 0.7847, "lr": 3.9426493427611177e-08, "epoch": 2.892, "percentage": 96.4, "elapsed_time": "11:15:21", "remaining_time": "0:25:13"}
|
724 |
+
{"current_steps": 724, "total_steps": 750, "loss": 0.8021, "lr": 3.65635942625242e-08, "epoch": 2.896, "percentage": 96.53, "elapsed_time": "11:16:20", "remaining_time": "0:24:17"}
|
725 |
+
{"current_steps": 725, "total_steps": 750, "loss": 0.8147, "lr": 3.3808211290284886e-08, "epoch": 2.9, "percentage": 96.67, "elapsed_time": "11:17:21", "remaining_time": "0:23:21"}
|
726 |
+
{"current_steps": 726, "total_steps": 750, "loss": 0.794, "lr": 3.1160404197018155e-08, "epoch": 2.904, "percentage": 96.8, "elapsed_time": "11:18:19", "remaining_time": "0:22:25"}
|
727 |
+
{"current_steps": 727, "total_steps": 750, "loss": 0.7908, "lr": 2.8620230338578526e-08, "epoch": 2.908, "percentage": 96.93, "elapsed_time": "11:19:18", "remaining_time": "0:21:29"}
|
728 |
+
{"current_steps": 728, "total_steps": 750, "loss": 0.8137, "lr": 2.6187744739308297e-08, "epoch": 2.912, "percentage": 97.07, "elapsed_time": "11:20:18", "remaining_time": "0:20:33"}
|
729 |
+
{"current_steps": 729, "total_steps": 750, "loss": 0.764, "lr": 2.386300009084408e-08, "epoch": 2.916, "percentage": 97.2, "elapsed_time": "11:21:09", "remaining_time": "0:19:37"}
|
730 |
+
{"current_steps": 730, "total_steps": 750, "loss": 0.7881, "lr": 2.1646046750978255e-08, "epoch": 2.92, "percentage": 97.33, "elapsed_time": "11:22:01", "remaining_time": "0:18:41"}
|
731 |
+
{"current_steps": 731, "total_steps": 750, "loss": 0.764, "lr": 1.953693274256374e-08, "epoch": 2.924, "percentage": 97.47, "elapsed_time": "11:22:49", "remaining_time": "0:17:44"}
|
732 |
+
{"current_steps": 732, "total_steps": 750, "loss": 0.7774, "lr": 1.753570375247815e-08, "epoch": 2.928, "percentage": 97.6, "elapsed_time": "11:23:47", "remaining_time": "0:16:48"}
|
733 |
+
{"current_steps": 733, "total_steps": 750, "loss": 0.7491, "lr": 1.5642403130632367e-08, "epoch": 2.932, "percentage": 97.73, "elapsed_time": "11:24:47", "remaining_time": "0:15:52"}
|
734 |
+
{"current_steps": 734, "total_steps": 750, "loss": 0.7755, "lr": 1.3857071889029073e-08, "epoch": 2.936, "percentage": 97.87, "elapsed_time": "11:25:40", "remaining_time": "0:14:56"}
|
735 |
+
{"current_steps": 735, "total_steps": 750, "loss": 0.7924, "lr": 1.2179748700879013e-08, "epoch": 2.94, "percentage": 98.0, "elapsed_time": "11:26:31", "remaining_time": "0:14:00"}
|
736 |
+
{"current_steps": 736, "total_steps": 750, "loss": 0.8068, "lr": 1.0610469899760001e-08, "epoch": 2.944, "percentage": 98.13, "elapsed_time": "11:27:16", "remaining_time": "0:13:04"}
|
737 |
+
{"current_steps": 737, "total_steps": 750, "loss": 0.7816, "lr": 9.14926947883088e-09, "epoch": 2.948, "percentage": 98.27, "elapsed_time": "11:28:09", "remaining_time": "0:12:08"}
|
738 |
+
{"current_steps": 738, "total_steps": 750, "loss": 0.7837, "lr": 7.796179090094891e-09, "epoch": 2.952, "percentage": 98.4, "elapsed_time": "11:29:02", "remaining_time": "0:11:12"}
|
739 |
+
{"current_steps": 739, "total_steps": 750, "loss": 0.8002, "lr": 6.551228043715218e-09, "epoch": 2.956, "percentage": 98.53, "elapsed_time": "11:30:08", "remaining_time": "0:10:16"}
|
740 |
+
{"current_steps": 740, "total_steps": 750, "loss": 0.7759, "lr": 5.414443307377171e-09, "epoch": 2.96, "percentage": 98.67, "elapsed_time": "11:30:57", "remaining_time": "0:09:20"}
|
741 |
+
{"current_steps": 741, "total_steps": 750, "loss": 0.7821, "lr": 4.385849505708084e-09, "epoch": 2.964, "percentage": 98.8, "elapsed_time": "11:32:01", "remaining_time": "0:08:24"}
|
742 |
+
{"current_steps": 742, "total_steps": 750, "loss": 0.7754, "lr": 3.4654689197405335e-09, "epoch": 2.968, "percentage": 98.93, "elapsed_time": "11:33:10", "remaining_time": "0:07:28"}
|
743 |
+
{"current_steps": 743, "total_steps": 750, "loss": 0.7755, "lr": 2.6533214864310485e-09, "epoch": 2.972, "percentage": 99.07, "elapsed_time": "11:34:03", "remaining_time": "0:06:32"}
|
744 |
+
{"current_steps": 744, "total_steps": 750, "loss": 0.7779, "lr": 1.9494247982282386e-09, "epoch": 2.976, "percentage": 99.2, "elapsed_time": "11:34:57", "remaining_time": "0:05:36"}
|
745 |
+
{"current_steps": 745, "total_steps": 750, "loss": 0.7995, "lr": 1.3537941026914302e-09, "epoch": 2.98, "percentage": 99.33, "elapsed_time": "11:35:52", "remaining_time": "0:04:40"}
|
746 |
+
{"current_steps": 746, "total_steps": 750, "loss": 0.7679, "lr": 8.664423021614854e-10, "epoch": 2.984, "percentage": 99.47, "elapsed_time": "11:36:50", "remaining_time": "0:03:44"}
|
747 |
+
{"current_steps": 747, "total_steps": 750, "loss": 0.8057, "lr": 4.87379953478806e-10, "epoch": 2.988, "percentage": 99.6, "elapsed_time": "11:37:44", "remaining_time": "0:02:48"}
|
748 |
+
{"current_steps": 748, "total_steps": 750, "loss": 0.7728, "lr": 2.1661526775795804e-10, "epoch": 2.992, "percentage": 99.73, "elapsed_time": "11:38:45", "remaining_time": "0:01:52"}
|
749 |
+
{"current_steps": 749, "total_steps": 750, "loss": 0.7773, "lr": 5.4154110206150465e-11, "epoch": 2.996, "percentage": 99.87, "elapsed_time": "11:39:41", "remaining_time": "0:00:56"}
|
750 |
+
{"current_steps": 750, "total_steps": 750, "loss": 0.7804, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "11:40:36", "remaining_time": "0:00:00"}
|
751 |
+
{"current_steps": 750, "total_steps": 750, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "11:42:43", "remaining_time": "0:00:00"}
|