{ | |
"epoch": 1.0, | |
"eval_loss": 2.1312263011932373, | |
"eval_runtime": 2.6837, | |
"eval_samples_per_second": 13.787, | |
"eval_steps_per_second": 1.863, | |
"perplexity": 8.425192302438928, | |
"total_flos": 4161668422041600.0, | |
"train_loss": 2.3460041029484513, | |
"train_runtime": 71.1285, | |
"train_samples_per_second": 6.439, | |
"train_steps_per_second": 3.22 | |
} |