{ "epoch": 20.0, "eval_accuracy": 0.41106143702911596, "eval_loss": 3.407801628112793, "eval_runtime": 225.6692, "eval_samples": 57921, "eval_samples_per_second": 256.663, "eval_steps_per_second": 2.007, "perplexity": 30.198783077224352, "train_loss": 3.0278301616277896, "train_runtime": 112002.0514, "train_samples": 595034, "train_samples_per_second": 106.254, "train_steps_per_second": 3.32 }