{ "epoch": 3.0, "eval_loss": 3.5185182094573975, "eval_runtime": 2.7592, "eval_samples": 7, "eval_samples_per_second": 2.537, "eval_steps_per_second": 0.362, "perplexity": 33.734404089240414, "train_loss": 3.5635623023623513, "train_runtime": 37.6452, "train_samples": 14, "train_samples_per_second": 1.116, "train_steps_per_second": 0.558 }