{ "epoch": 1.0, "eval_loss": 2.216308832168579, "eval_runtime": 127.3922, "eval_samples_per_second": 246.271, "eval_steps_per_second": 15.393, "perplexity": 9.173407708925824, "total_flos": 1.59124040841796e+18, "train_loss": 2.428147726093893, "train_runtime": 2109.7476, "train_samples_per_second": 82.811, "train_steps_per_second": 5.176 }