{ "epoch": 0.0, "eval_loss": 44.2744026184082, "eval_runtime": 2.6297, "eval_samples": 437, "eval_samples_per_second": 166.177, "eval_steps_per_second": 14.07, "perplexity": 1.6909421376838556e+19, "train_loss": 41.470333099365234, "train_runtime": 8.8744, "train_samples": 4005, "train_samples_per_second": 1.352, "train_steps_per_second": 0.113 }