{ "epoch": 9.852216748768473, "eval_accuracy": 0.3451256113828368, "eval_loss": 3.7245092391967773, "eval_runtime": 6.0968, "eval_samples": 44, "eval_samples_per_second": 7.217, "eval_steps_per_second": 7.217, "perplexity": 41.4508852826151, "total_flos": 3.70944044433408e+17, "train_loss": 4.3953623046875, "train_runtime": 3726.3159, "train_samples": 812, "train_samples_per_second": 2.179, "train_steps_per_second": 0.134 }