{
  "epoch": 19.99718982717437,
  "eval_accuracy": 0.4210676920791576,
  "eval_loss": 3.009352207183838,
  "eval_runtime": 128.3569,
  "eval_samples": 45143,
  "eval_samples_per_second": 351.699,
  "eval_steps_per_second": 5.5,
  "perplexity": 20.274262149048695,
  "total_flos": 1.18991215558656e+18,
  "train_loss": 3.2179960425614373,
  "train_runtime": 62492.0089,
  "train_samples": 455458,
  "train_samples_per_second": 145.765,
  "train_steps_per_second": 0.569
}