{
  "epoch": 19.946666666666665,
  "eval_accuracy": 0.5885829596412556,
  "eval_loss": 3.0184407234191895,
  "eval_runtime": 7.0977,
  "eval_samples": 500,
  "eval_samples_per_second": 70.445,
  "eval_steps_per_second": 8.876,
  "perplexity": 20.45936499070068,
  "total_flos": 3.767212755417825e+17,
  "train_loss": 0.406913380316872,
  "train_runtime": 8744.2637,
  "train_samples": 6000,
  "train_samples_per_second": 13.723,
  "train_steps_per_second": 0.428
}