{ | |
"epoch": 19.995409685563462, | |
"eval_accuracy": 0.7611848617176128, | |
"eval_loss": 0.5757241249084473, | |
"eval_runtime": 9.1382, | |
"eval_samples": 500, | |
"eval_samples_per_second": 54.716, | |
"eval_steps_per_second": 6.894, | |
"perplexity": 1.7784178574319338, | |
"total_flos": 2.2953223726028554e+18, | |
"train_loss": 0.6653460843285034, | |
"train_runtime": 50472.5887, | |
"train_samples": 34854, | |
"train_samples_per_second": 13.811, | |
"train_steps_per_second": 0.432 | |
} |