{ "epoch": 1.0, "eval_loss": 1.950162649154663, "eval_runtime": 116.7358, "eval_samples_per_second": 22.041, "eval_steps_per_second": 2.758, "perplexity": 7.029830883658786, "total_flos": 2.1665532198912e+17, "train_loss": 2.01907276283447, "train_runtime": 3147.1141, "train_samples_per_second": 7.559, "train_steps_per_second": 3.78 }