{ | |
"epoch": 1.0, | |
"eval_loss": 2.18013596534729, | |
"eval_runtime": 9.846, | |
"eval_samples_per_second": 22.141, | |
"eval_steps_per_second": 2.844, | |
"perplexity": 8.847509131596244, | |
"total_flos": 2.42426139967488e+16, | |
"train_loss": 2.3308336977473276, | |
"train_runtime": 355.7712, | |
"train_samples_per_second": 7.508, | |
"train_steps_per_second": 3.755 | |
} |