{ | |
"epoch": 25.0, | |
"eval_accuracy": 0.4167961357023813, | |
"eval_loss": 6.040319442749023, | |
"eval_runtime": 1.0257, | |
"eval_samples": 479, | |
"eval_samples_per_second": 466.985, | |
"eval_steps_per_second": 2.925, | |
"perplexity": 420.0271880980293, | |
"total_flos": 3.051148107142656e+17, | |
"train_loss": 7.903556559985129, | |
"train_runtime": 20916.6184, | |
"train_samples": 228639, | |
"train_samples_per_second": 273.274, | |
"train_steps_per_second": 1.708 | |
} |