{
"epoch": 25.0,
"eval_accuracy": 0.6793461178036027,
"eval_loss": 3.871241331100464,
"eval_runtime": 173.6845,
"eval_samples": 120706,
"eval_samples_per_second": 694.973,
"eval_steps_per_second": 4.347,
"perplexity": 48.001935408261254,
"total_flos": 3.039073706855117e+18,
"train_loss": 4.565901666523048,
"train_runtime": 125705.0232,
"train_samples": 2277342,
"train_samples_per_second": 452.914,
"train_steps_per_second": 2.831
}