{
    "epoch": 30.0,
    "eval_accuracy": 0.15905819453012543,
    "eval_loss": 6.060703277587891,
    "eval_runtime": 50.7232,
    "eval_samples": 8106,
    "eval_samples_per_second": 159.809,
    "eval_steps_per_second": 39.962,
    "perplexity": 428.67680966518134,
    "total_flos": 1.773277289442432e+16,
    "train_loss": 3.0397992164007466,
    "train_runtime": 4647.9256,
    "train_samples": 160441,
    "train_samples_per_second": 1035.565,
    "train_steps_per_second": 8.094
}