smolm-autoreg-bpe-seed_444 / all_results.json
kanishka's picture
End of training
594dc88 verified
raw
history blame
443 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.4995467750899875,
"eval_loss": 2.4751720428466797,
"eval_runtime": 3.3732,
"eval_samples": 4491,
"eval_samples_per_second": 1331.385,
"eval_steps_per_second": 10.672,
"perplexity": 11.883751451666422,
"train_loss": 2.5668444753344595,
"train_runtime": 741.451,
"train_samples": 46845,
"train_samples_per_second": 631.802,
"train_steps_per_second": 39.49
}