{
  "epoch": 3.0,
  "eval_loss": 3.9845974445343018,
  "eval_runtime": 1425.6748,
  "eval_samples": 32253,
  "eval_samples_per_second": 22.623,
  "eval_steps_per_second": 3.771,
  "perplexity": 53.7636422730289,
  "train_loss": 0.7859680134460877,
  "train_runtime": 210975.8843,
  "train_samples": 3196485,
  "train_samples_per_second": 45.453,
  "train_steps_per_second": 7.575
}