{
"epoch": 20.0,
"eval_accuracy": 0.4066641958384616,
"eval_loss": 3.41624116897583,
"eval_runtime": 153.8779,
"eval_samples": 57921,
"eval_samples_per_second": 376.409,
"eval_steps_per_second": 5.888,
"perplexity": 30.45472543989185,
"total_flos": 1.5669257538816e+18,
"train_loss": 3.1555080074711364,
"train_runtime": 80953.5697,
"train_samples": 595035,
"train_samples_per_second": 147.006,
"train_steps_per_second": 4.594
}