File size: 15,593 Bytes
408517c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
{"current_steps": 5, "total_steps": 312, "loss": 2.8923, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019987329060020616, "epoch": 0.02, "percentage": 1.6, "elapsed_time": "0:00:44", "remaining_time": "0:45:07"}
{"current_steps": 10, "total_steps": 312, "loss": 2.0944, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019949348350626456, "epoch": 0.03, "percentage": 3.21, "elapsed_time": "0:01:26", "remaining_time": "0:43:22"}
{"current_steps": 15, "total_steps": 312, "loss": 2.0323, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019886154122075343, "epoch": 0.05, "percentage": 4.81, "elapsed_time": "0:02:12", "remaining_time": "0:43:39"}
{"current_steps": 20, "total_steps": 312, "loss": 1.9436, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019797906520422677, "epoch": 0.06, "percentage": 6.41, "elapsed_time": "0:02:57", "remaining_time": "0:43:14"}
{"current_steps": 25, "total_steps": 312, "loss": 2.0292, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019684829181681234, "epoch": 0.08, "percentage": 8.01, "elapsed_time": "0:03:41", "remaining_time": "0:42:24"}
{"current_steps": 30, "total_steps": 312, "loss": 1.9654, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019547208665085457, "epoch": 0.1, "percentage": 9.62, "elapsed_time": "0:04:18", "remaining_time": "0:40:33"}
{"current_steps": 35, "total_steps": 312, "loss": 1.9041, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0001938539372689649, "epoch": 0.11, "percentage": 11.22, "elapsed_time": "0:04:58", "remaining_time": "0:39:18"}
{"current_steps": 40, "total_steps": 312, "loss": 1.8992, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00019199794436588243, "epoch": 0.13, "percentage": 12.82, "elapsed_time": "0:05:39", "remaining_time": "0:38:30"}
{"current_steps": 45, "total_steps": 312, "loss": 1.8393, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00018990881137654258, "epoch": 0.14, "percentage": 14.42, "elapsed_time": "0:06:24", "remaining_time": "0:38:02"}
{"current_steps": 50, "total_steps": 312, "loss": 1.615, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0001875918325566888, "epoch": 0.16, "percentage": 16.03, "elapsed_time": "0:07:08", "remaining_time": "0:37:27"}
{"current_steps": 55, "total_steps": 312, "loss": 1.9873, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00018505287956623297, "epoch": 0.18, "percentage": 17.63, "elapsed_time": "0:07:48", "remaining_time": "0:36:29"}
{"current_steps": 60, "total_steps": 312, "loss": 1.9264, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00018229838658936564, "epoch": 0.19, "percentage": 19.23, "elapsed_time": "0:08:33", "remaining_time": "0:35:58"}
{"current_steps": 65, "total_steps": 312, "loss": 1.828, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00017933533402912354, "epoch": 0.21, "percentage": 20.83, "elapsed_time": "0:09:19", "remaining_time": "0:35:24"}
{"current_steps": 70, "total_steps": 312, "loss": 1.8083, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00017617123081773591, "epoch": 0.22, "percentage": 22.44, "elapsed_time": "0:09:58", "remaining_time": "0:34:30"}
{"current_steps": 75, "total_steps": 312, "loss": 1.8268, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00017281409538757883, "epoch": 0.24, "percentage": 24.04, "elapsed_time": "0:10:38", "remaining_time": "0:33:36"}
{"current_steps": 80, "total_steps": 312, "loss": 1.7587, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00016927243535095997, "epoch": 0.26, "percentage": 25.64, "elapsed_time": "0:11:19", "remaining_time": "0:32:50"}
{"current_steps": 85, "total_steps": 312, "loss": 1.7939, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0001655552259402295, "epoch": 0.27, "percentage": 27.24, "elapsed_time": "0:12:06", "remaining_time": "0:32:19"}
{"current_steps": 90, "total_steps": 312, "loss": 1.848, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00016167188726285434, "epoch": 0.29, "percentage": 28.85, "elapsed_time": "0:12:46", "remaining_time": "0:31:31"}
{"current_steps": 95, "total_steps": 312, "loss": 1.7407, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00015763226042909455, "epoch": 0.3, "percentage": 30.45, "elapsed_time": "0:13:24", "remaining_time": "0:30:37"}
{"current_steps": 100, "total_steps": 312, "loss": 1.8559, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0001534465826127801, "epoch": 0.32, "percentage": 32.05, "elapsed_time": "0:14:12", "remaining_time": "0:30:06"}
{"current_steps": 105, "total_steps": 312, "loss": 1.8363, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00014912546110838775, "epoch": 0.34, "percentage": 33.65, "elapsed_time": "0:14:56", "remaining_time": "0:29:27"}
{"current_steps": 110, "total_steps": 312, "loss": 1.6798, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00014467984645016258, "epoch": 0.35, "percentage": 35.26, "elapsed_time": "0:15:40", "remaining_time": "0:28:47"}
{"current_steps": 115, "total_steps": 312, "loss": 1.6868, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00014012100466140578, "epoch": 0.37, "percentage": 36.86, "elapsed_time": "0:16:25", "remaining_time": "0:28:09"}
{"current_steps": 120, "total_steps": 312, "loss": 1.8213, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00013546048870425356, "epoch": 0.38, "percentage": 38.46, "elapsed_time": "0:17:09", "remaining_time": "0:27:27"}
{"current_steps": 125, "total_steps": 312, "loss": 1.7561, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00013071010920229909, "epoch": 0.4, "percentage": 40.06, "elapsed_time": "0:17:54", "remaining_time": "0:26:46"}
{"current_steps": 130, "total_steps": 312, "loss": 1.7834, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00012588190451025207, "epoch": 0.42, "percentage": 41.67, "elapsed_time": "0:18:38", "remaining_time": "0:26:06"}
{"current_steps": 135, "total_steps": 312, "loss": 1.9342, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00012098811020648475, "epoch": 0.43, "percentage": 43.27, "elapsed_time": "0:19:27", "remaining_time": "0:25:30"}
{"current_steps": 140, "total_steps": 312, "loss": 1.8081, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00011604112808577603, "epoch": 0.45, "percentage": 44.87, "elapsed_time": "0:20:14", "remaining_time": "0:24:52"}
{"current_steps": 145, "total_steps": 312, "loss": 1.7449, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.000111053494730832, "epoch": 0.46, "percentage": 46.47, "elapsed_time": "0:21:00", "remaining_time": "0:24:11"}
{"current_steps": 150, "total_steps": 312, "loss": 1.8202, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00010603784974222861, "epoch": 0.48, "percentage": 48.08, "elapsed_time": "0:21:41", "remaining_time": "0:23:25"}
{"current_steps": 155, "total_steps": 312, "loss": 1.7587, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00010100690370728755, "epoch": 0.5, "percentage": 49.68, "elapsed_time": "0:22:24", "remaining_time": "0:22:41"}
{"current_steps": 160, "total_steps": 312, "loss": 1.8827, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.597340598905852e-05, "epoch": 0.51, "percentage": 51.28, "elapsed_time": "0:23:07", "remaining_time": "0:21:58"}
{"current_steps": 165, "total_steps": 312, "loss": 1.8022, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.095011241703623e-05, "epoch": 0.53, "percentage": 52.88, "elapsed_time": "0:23:45", "remaining_time": "0:21:09"}
{"current_steps": 170, "total_steps": 312, "loss": 1.7515, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.594975296149076e-05, "epoch": 0.54, "percentage": 54.49, "elapsed_time": "0:24:31", "remaining_time": "0:20:28"}
{"current_steps": 175, "total_steps": 312, "loss": 1.7027, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.098499947332934e-05, "epoch": 0.56, "percentage": 56.09, "elapsed_time": "0:25:12", "remaining_time": "0:19:44"}
{"current_steps": 180, "total_steps": 312, "loss": 1.7445, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.606843357124426e-05, "epoch": 0.58, "percentage": 57.69, "elapsed_time": "0:25:55", "remaining_time": "0:19:00"}
{"current_steps": 185, "total_steps": 312, "loss": 1.7094, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.121251475752539e-05, "epoch": 0.59, "percentage": 59.29, "elapsed_time": "0:26:35", "remaining_time": "0:18:15"}
{"current_steps": 190, "total_steps": 312, "loss": 1.7047, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.642954884333955e-05, "epoch": 0.61, "percentage": 60.9, "elapsed_time": "0:27:15", "remaining_time": "0:17:30"}
{"current_steps": 195, "total_steps": 312, "loss": 1.6086, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.173165676349103e-05, "epoch": 0.62, "percentage": 62.5, "elapsed_time": "0:27:56", "remaining_time": "0:16:46"}
{"current_steps": 200, "total_steps": 312, "loss": 1.7098, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.713074385969457e-05, "epoch": 0.64, "percentage": 64.1, "elapsed_time": "0:28:41", "remaining_time": "0:16:03"}
{"current_steps": 205, "total_steps": 312, "loss": 1.7766, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.263846971020108e-05, "epoch": 0.66, "percentage": 65.71, "elapsed_time": "0:29:23", "remaining_time": "0:15:20"}
{"current_steps": 210, "total_steps": 312, "loss": 1.9863, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.826621858223431e-05, "epoch": 0.67, "percentage": 67.31, "elapsed_time": "0:30:02", "remaining_time": "0:14:35"}
{"current_steps": 215, "total_steps": 312, "loss": 1.7957, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.40250705821178e-05, "epoch": 0.69, "percentage": 68.91, "elapsed_time": "0:30:42", "remaining_time": "0:13:51"}
{"current_steps": 220, "total_steps": 312, "loss": 1.7848, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.99257735762021e-05, "epoch": 0.7, "percentage": 70.51, "elapsed_time": "0:31:25", "remaining_time": "0:13:08"}
{"current_steps": 225, "total_steps": 312, "loss": 1.8688, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.597871595375121e-05, "epoch": 0.72, "percentage": 72.12, "elapsed_time": "0:32:07", "remaining_time": "0:12:25"}
{"current_steps": 230, "total_steps": 312, "loss": 1.6451, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.219390030081091e-05, "epoch": 0.74, "percentage": 73.72, "elapsed_time": "0:32:50", "remaining_time": "0:11:42"}
{"current_steps": 235, "total_steps": 312, "loss": 1.8795, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.858091805177554e-05, "epoch": 0.75, "percentage": 75.32, "elapsed_time": "0:33:32", "remaining_time": "0:10:59"}
{"current_steps": 240, "total_steps": 312, "loss": 1.7631, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.514892518288988e-05, "epoch": 0.77, "percentage": 76.92, "elapsed_time": "0:34:15", "remaining_time": "0:10:16"}
{"current_steps": 245, "total_steps": 312, "loss": 1.7843, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1906619009284257e-05, "epoch": 0.78, "percentage": 78.53, "elapsed_time": "0:34:56", "remaining_time": "0:09:33"}
{"current_steps": 250, "total_steps": 312, "loss": 1.7854, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8862216144342692e-05, "epoch": 0.8, "percentage": 80.13, "elapsed_time": "0:35:41", "remaining_time": "0:08:51"}
{"current_steps": 255, "total_steps": 312, "loss": 1.5676, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6023431677260214e-05, "epoch": 0.82, "percentage": 81.73, "elapsed_time": "0:36:23", "remaining_time": "0:08:08"}
{"current_steps": 260, "total_steps": 312, "loss": 1.6083, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.339745962155613e-05, "epoch": 0.83, "percentage": 83.33, "elapsed_time": "0:37:14", "remaining_time": "0:07:26"}
{"current_steps": 265, "total_steps": 312, "loss": 1.8291, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0990954684091558e-05, "epoch": 0.85, "percentage": 84.94, "elapsed_time": "0:37:55", "remaining_time": "0:06:43"}
{"current_steps": 270, "total_steps": 312, "loss": 1.7606, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.810015400790994e-06, "epoch": 0.86, "percentage": 86.54, "elapsed_time": "0:38:40", "remaining_time": "0:06:01"}
{"current_steps": 275, "total_steps": 312, "loss": 1.7076, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.860168681805945e-06, "epoch": 0.88, "percentage": 88.14, "elapsed_time": "0:39:25", "remaining_time": "0:05:18"}
{"current_steps": 280, "total_steps": 312, "loss": 1.706, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.146355805285452e-06, "epoch": 0.9, "percentage": 89.74, "elapsed_time": "0:40:09", "remaining_time": "0:04:35"}
{"current_steps": 285, "total_steps": 312, "loss": 1.7685, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6729198952483724e-06, "epoch": 0.91, "percentage": 91.35, "elapsed_time": "0:40:56", "remaining_time": "0:03:52"}
{"current_steps": 290, "total_steps": 312, "loss": 1.7422, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4435949152906145e-06, "epoch": 0.93, "percentage": 92.95, "elapsed_time": "0:41:35", "remaining_time": "0:03:09"}
{"current_steps": 295, "total_steps": 312, "loss": 1.8109, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4614962060194304e-06, "epoch": 0.94, "percentage": 94.55, "elapsed_time": "0:42:19", "remaining_time": "0:02:26"}
{"current_steps": 300, "total_steps": 312, "loss": 1.7055, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.291125901946027e-07, "epoch": 0.96, "percentage": 96.15, "elapsed_time": "0:43:04", "remaining_time": "0:01:43"}
{"current_steps": 305, "total_steps": 312, "loss": 1.73, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4830006558373973e-07, "epoch": 0.98, "percentage": 97.76, "elapsed_time": "0:43:47", "remaining_time": "0:01:00"}
{"current_steps": 310, "total_steps": 312, "loss": 1.9092, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0277101514987184e-08, "epoch": 0.99, "percentage": 99.36, "elapsed_time": "0:44:31", "remaining_time": "0:00:17"}
{"current_steps": 312, "total_steps": 312, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:44:45", "remaining_time": "0:00:00"}