{
  "epoch": 0.99968,
  "eval_loss": 1.097437858581543,
  "eval_runtime": 230.0389,
  "eval_samples": 12500,
  "eval_samples_per_second": 54.339,
  "eval_steps_per_second": 6.795,
  "perplexity": 2.9964787778596422,
  "total_flos": 6.457467788899123e+16,
  "train_loss": 1.3367621437688184,
  "train_runtime": 11215.3396,
  "train_samples": 100000,
  "train_samples_per_second": 8.916,
  "train_steps_per_second": 0.139
}