{
    "epoch": 20.0,
    "eval_accuracy": 0.4074434673767711,
    "eval_loss": 3.400710105895996,
    "eval_runtime": 157.1955,
    "eval_samples": 57921,
    "eval_samples_per_second": 368.465,
    "eval_steps_per_second": 5.764,
    "perplexity": 29.98538528800189,
    "total_flos": 1.5669257538816e+18,
    "train_loss": 3.15551687307786,
    "train_runtime": 81149.9259,
    "train_samples": 595035,
    "train_samples_per_second": 146.651,
    "train_steps_per_second": 4.583
}