{
  "epoch": 25.0,
  "eval_accuracy": 0.155817370175736,
  "eval_loss": 8.267388343811035,
  "eval_runtime": 0.7261,
  "eval_samples": 479,
  "eval_samples_per_second": 659.726,
  "eval_steps_per_second": 6.886,
  "perplexity": 3894.7639137017945,
  "total_flos": 1.5151126801503744e+18,
  "train_loss": 8.487465922806464,
  "train_runtime": 17081.4633,
  "train_samples": 228639,
  "train_samples_per_second": 334.63,
  "train_steps_per_second": 3.486
}