{
    "epoch": 20.0,
    "eval_accuracy": 0.7134618834080717,
    "eval_loss": 0.9358564019203186,
    "eval_runtime": 6.0586,
    "eval_samples": 500,
    "eval_samples_per_second": 82.527,
    "eval_steps_per_second": 10.398,
    "perplexity": 2.549395830596446,
    "total_flos": 9.64242245391745e+17,
    "train_loss": 1.2100651977192927,
    "train_runtime": 22841.5406,
    "train_samples": 16925,
    "train_samples_per_second": 14.819,
    "train_steps_per_second": 0.463
}