{
  "epoch": 0.4298328355080438,
  "eval_accuracy": 0.37965929269827176,
  "eval_loss": 3.1287243366241455,
  "eval_perplexity": 22.844818648175387,
  "eval_runtime": 523.5836,
  "eval_samples": 55176,
  "eval_samples_per_second": 105.381,
  "eval_steps_per_second": 2.196,
  "total_flos": 1.2345107794414797e+18,
  "train_loss": 3.067183213959159,
  "train_runtime": 46797.6916,
  "train_samples": 5495866,
  "train_samples_per_second": 11743.883,
  "train_steps_per_second": 244.666
}