{ "epoch": 6.84, "eval_loss": 1.0630253553390503, "eval_runtime": 417.3757, "eval_samples": 1000, "eval_samples_per_second": 6.881, "eval_steps_per_second": 3.441, "perplexity": 2.895116509633705, "train_loss": 0.8530817114257813, "train_runtime": 94563.3332, "train_samples": 10000, "train_samples_per_second": 2.115, "train_steps_per_second": 0.264 }