{ | |
"epoch": 20.0, | |
"eval_accuracy": 0.25270675362470885, | |
"eval_loss": 5.005028247833252, | |
"eval_runtime": 10.9985, | |
"eval_samples": 4053, | |
"eval_samples_per_second": 368.506, | |
"eval_steps_per_second": 92.195, | |
"perplexity": 149.16129658231105, | |
"total_flos": 488922611712000.0, | |
"train_loss": 5.48259629872295, | |
"train_runtime": 4495.3437, | |
"train_samples": 80219, | |
"train_samples_per_second": 356.898, | |
"train_steps_per_second": 22.308 | |
} |