{ "epoch": 25.0, "eval_accuracy": 0.16143611762379595, "eval_loss": 7.2607574462890625, "eval_runtime": 1.0106, "eval_samples": 479, "eval_samples_per_second": 473.96, "eval_steps_per_second": 2.968, "perplexity": 1423.334228232389, "total_flos": 3.049796905526016e+17, "train_loss": 7.630663348358774, "train_runtime": 20886.7559, "train_samples": 228639, "train_samples_per_second": 273.665, "train_steps_per_second": 1.71 }