{
  "epoch": 0.2328830926874709,
  "eval_accuracy": 0.7678859647632478,
  "eval_loss": 0.9773336052894592,
  "eval_runtime": 27.5702,
  "eval_samples": 581,
  "eval_samples_per_second": 21.073,
  "eval_steps_per_second": 0.363,
  "perplexity": 2.6573612131766415,
  "total_flos": 1.3069163715939533e+18,
  "train_loss": 1.361302978515625,
  "train_runtime": 10712.6155,
  "train_samples": 274768,
  "train_samples_per_second": 76.947,
  "train_steps_per_second": 1.203
}