{
  "epoch": 0.39269681566490244,
  "eval_accuracy": 0.3771482663988522,
  "eval_loss": 3.1479039192199707,
  "eval_perplexity": 23.287201532831283,
  "eval_runtime": 674.2767,
  "eval_samples": 55176,
  "eval_samples_per_second": 81.83,
  "eval_steps_per_second": 1.706,
  "total_flos": 1.1278534630535332e+18,
  "train_loss": 3.096997114293975,
  "train_runtime": 46795.6115,
  "train_samples": 5495866,
  "train_samples_per_second": 11744.405,
  "train_steps_per_second": 244.677
}