{ | |
"epoch": 19.970717423133237, | |
"eval_accuracy": 0.4408205128205128, | |
"eval_loss": 4.3716583251953125, | |
"eval_runtime": 5.3473, | |
"eval_samples": 500, | |
"eval_samples_per_second": 93.505, | |
"eval_steps_per_second": 11.782, | |
"perplexity": 79.17482049231646, | |
"total_flos": 5.856471132500132e+17, | |
"train_loss": 1.4925127781730942, | |
"train_runtime": 14626.8571, | |
"train_samples": 10925, | |
"train_samples_per_second": 14.938, | |
"train_steps_per_second": 0.466 | |
} |