{ "epoch": 94.78, "eval_accuracy": 0.4534356430493973, "eval_loss": 3.1695425510406494, "eval_runtime": 128.1811, "eval_samples": 24055, "eval_samples_per_second": 187.664, "eval_steps_per_second": 5.867, "perplexity": 23.796596138077017, "train_loss": 3.832834072322636, "train_runtime": 39205.3218, "train_samples": 24910, "train_samples_per_second": 63.537, "train_steps_per_second": 0.122 }