{
"epoch": 0.018308631211857017,
"eval_accuracy": 0.08509852797509099,
"eval_loss": 9.4765625,
"eval_runtime": 276.521,
"eval_samples": 33767,
"eval_samples_per_second": 122.114,
"eval_steps_per_second": 3.392,
"perplexity": 13050.249090978768,
"total_flos": 352197518819328.0,
"train_loss": 10.035667782738095,
"train_runtime": 94125.7847,
"train_samples": 660643,
"train_samples_per_second": 701.873,
"train_steps_per_second": 19.497
}