{ "epoch": 20.0, "eval_accuracy": 0.4112049304778943, "eval_loss": 3.4044251441955566, "eval_runtime": 224.9856, "eval_samples": 57921, "eval_samples_per_second": 257.443, "eval_steps_per_second": 2.013, "perplexity": 30.096989321043814, "train_loss": 3.025763815510302, "train_runtime": 112290.5798, "train_samples": 595034, "train_samples_per_second": 105.981, "train_steps_per_second": 3.312 }