{
  "epoch": 4.0,
  "eval_loss": 2.4018473625183105,
  "eval_runtime": 343.4017,
  "eval_samples_per_second": 205.89,
  "eval_steps_per_second": 1.61,
  "perplexity": 11.043559004771115,
  "total_flos": 4159012790599680.0,
  "train_loss": 0.7021765150223461,
  "train_runtime": 17437.0559,
  "train_samples_per_second": 145.971,
  "train_steps_per_second": 2.281
}