{
  "epoch": 20.0,
  "eval_accuracy": 0.6657583697234353,
  "eval_loss": 1.8696147203445435,
  "eval_runtime": 8.0567,
  "eval_samples": 500,
  "eval_samples_per_second": 62.06,
  "eval_steps_per_second": 7.82,
  "perplexity": 6.485797072186353,
  "total_flos": 9.221411586147615e+17,
  "train_loss": 1.163707649230957,
  "train_runtime": 11749.7477,
  "train_samples": 8000,
  "train_samples_per_second": 13.617,
  "train_steps_per_second": 0.426
}