{
  "epoch": 20.0,
  "eval_accuracy": 0.7981434977578475,
  "eval_loss": 0.43110987544059753,
  "eval_runtime": 7.0185,
  "eval_samples": 500,
  "eval_samples_per_second": 71.24,
  "eval_steps_per_second": 8.976,
  "perplexity": 1.5389646350848876,
  "total_flos": 9.64242245391745e+17,
  "train_loss": 0.3966417311720677,
  "train_runtime": 24179.107,
  "train_samples": 16925,
  "train_samples_per_second": 14.0,
  "train_steps_per_second": 0.438
}