{
  "epoch": 20.0,
  "eval_accuracy": 0.4080815719204785,
  "eval_loss": 3.3971192836761475,
  "eval_runtime": 153.9706,
  "eval_samples": 57918,
  "eval_samples_per_second": 376.163,
  "eval_steps_per_second": 5.878,
  "perplexity": 29.87790618490111,
  "total_flos": 1.5667414205184e+18,
  "train_loss": 3.1547193204799435,
  "train_runtime": 81066.2548,
  "train_samples": 594965,
  "train_samples_per_second": 146.785,
  "train_steps_per_second": 4.587
}