{ "epoch": 1.0, "eval_loss": 1.9279512166976929, "eval_runtime": 9.703, "eval_samples_per_second": 13.604, "eval_steps_per_second": 1.752, "perplexity": 6.875409577572064, "total_flos": 1.80550985908224e+16, "train_loss": 2.145273788114429, "train_runtime": 315.4776, "train_samples_per_second": 6.298, "train_steps_per_second": 3.151 }