{ "epoch": 3.0, "eval_loss": 3.6250336170196533, "eval_runtime": 0.6213, "eval_samples": 5, "eval_samples_per_second": 8.048, "eval_steps_per_second": 1.61, "perplexity": 37.525984650160595, "train_loss": 3.7773597353980657, "train_runtime": 16.24, "train_samples": 13, "train_samples_per_second": 2.401, "train_steps_per_second": 1.293 }