{
    "epoch": 20.0,
    "eval_accuracy": 0.7918744394618834,
    "eval_loss": 0.45650961995124817,
    "eval_runtime": 6.6411,
    "eval_samples": 500,
    "eval_samples_per_second": 75.288,
    "eval_steps_per_second": 9.486,
    "perplexity": 1.5785546027358068,
    "total_flos": 9.64242245391745e+17,
    "train_loss": 0.42894544871858475,
    "train_runtime": 22582.9978,
    "train_samples": 16925,
    "train_samples_per_second": 14.989,
    "train_steps_per_second": 0.468
}