{ | |
"epoch": 19.998892396300604, | |
"eval_accuracy": 0.47865689612852264, | |
"eval_loss": 2.6880221366882324, | |
"eval_runtime": 120.6441, | |
"eval_samples": 60791, | |
"eval_samples_per_second": 503.887, | |
"eval_steps_per_second": 7.874, | |
"perplexity": 14.702567474871172, | |
"total_flos": 1.50966240067584e+18, | |
"train_loss": 2.8030111154835997, | |
"train_runtime": 43302.4979, | |
"train_samples": 577799, | |
"train_samples_per_second": 266.866, | |
"train_steps_per_second": 1.042 | |
} |