{ "epoch": 1.0, "eval_loss": 3.4997777938842773, "eval_runtime": 448.829, "eval_samples": 40311, "eval_samples_per_second": 89.814, "eval_steps_per_second": 7.486, "perplexity": 33.10809432022858, "train_loss": 3.4927627832876236, "train_runtime": 361845.2402, "train_samples": 8570756, "train_samples_per_second": 23.686, "train_steps_per_second": 1.974 }