smolm-mlm-bpe-unmask-seed_111 / all_results.json
kanishka's picture
End of training
c7994a3
raw
history blame
No virus
447 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.44921721224601036,
"eval_loss": 2.69555401802063,
"eval_runtime": 8.7444,
"eval_samples": 70000,
"eval_samples_per_second": 8005.085,
"eval_steps_per_second": 15.667,
"perplexity": 14.813723550074597,
"train_loss": 3.080881611061448,
"train_runtime": 7359.6812,
"train_samples": 763989,
"train_samples_per_second": 1038.074,
"train_steps_per_second": 16.221
}