{ "epoch": 1.53, "eval_accuracy": 2.9114457332740555e-05, "eval_loss": NaN, "eval_runtime": 1244.2688, "eval_samples": 308356, "eval_samples_per_second": 247.821, "eval_steps_per_second": 3.873, "perplexity": NaN, "train_loss": 0.3459514281929236, "train_runtime": 108836.6872, "train_samples": 5858758, "train_samples_per_second": 269.154, "train_steps_per_second": 4.206 }