|
{"current_steps": 50, "total_steps": 356, "loss": 3.712, "learning_rate": 9.53723622631339e-06, "epoch": 0.2807017543859649, "percentage": 14.04, "elapsed_time": "0:09:50", "remaining_time": "1:00:13", "throughput": 1398.43, "total_tokens": 825600} |
|
{"current_steps": 100, "total_steps": 356, "loss": 0.1276, "learning_rate": 8.20073735379715e-06, "epoch": 0.5614035087719298, "percentage": 28.09, "elapsed_time": "0:19:40", "remaining_time": "0:50:21", "throughput": 1399.22, "total_tokens": 1651200} |
|
{"current_steps": 150, "total_steps": 356, "loss": 0.0644, "learning_rate": 6.247734714199105e-06, "epoch": 0.8421052631578947, "percentage": 42.13, "elapsed_time": "0:29:29", "remaining_time": "0:40:29", "throughput": 1399.82, "total_tokens": 2476800} |
|
{"current_steps": 200, "total_steps": 356, "loss": 0.0091, "learning_rate": 4.054402092289354e-06, "epoch": 1.1228070175438596, "percentage": 56.18, "elapsed_time": "0:39:18", "remaining_time": "0:30:39", "throughput": 1400.01, "total_tokens": 3302400} |
|
{"current_steps": 250, "total_steps": 356, "loss": 0.0451, "learning_rate": 2.0432039624699016e-06, "epoch": 1.4035087719298245, "percentage": 70.22, "elapsed_time": "0:49:08", "remaining_time": "0:20:49", "throughput": 1400.24, "total_tokens": 4128000} |
|
{"current_steps": 300, "total_steps": 356, "loss": 0.0004, "learning_rate": 6.015233200716874e-07, "epoch": 1.6842105263157894, "percentage": 84.27, "elapsed_time": "0:58:57", "remaining_time": "0:11:00", "throughput": 1400.34, "total_tokens": 4953600} |
|
{"current_steps": 350, "total_steps": 356, "loss": 0.0069, "learning_rate": 7.046663148979616e-09, "epoch": 1.9649122807017543, "percentage": 98.31, "elapsed_time": "1:08:46", "remaining_time": "0:01:10", "throughput": 1400.38, "total_tokens": 5779200} |
|
{"current_steps": 356, "total_steps": 356, "epoch": 1.9985964912280703, "percentage": 100.0, "elapsed_time": "1:09:58", "remaining_time": "0:00:00", "throughput": 1400.1, "total_tokens": 5878272} |
|
|