{
  "epoch": 20.0,
  "eval_accuracy": 0.47418153806650404,
  "eval_loss": 3.3325774669647217,
  "eval_runtime": 29.361,
  "eval_samples": 4053,
  "eval_samples_per_second": 138.04,
  "eval_steps_per_second": 34.536,
  "perplexity": 28.01044473770335,
  "total_flos": 1.0559446100070912e+17,
  "train_loss": 0.8717835233465437,
  "train_runtime": 7516.252,
  "train_samples": 80219,
  "train_samples_per_second": 213.455,
  "train_steps_per_second": 13.342
}