distilled-mt5-small-0.8-1 / all_results.json
Lvxue's picture
End of training
5af3de5
raw
history blame contribute delete
412 Bytes
{
"epoch": 5.0,
"eval_bleu": 6.6553,
"eval_gen_len": 45.5138,
"eval_loss": 2.8309686183929443,
"eval_runtime": 636.8376,
"eval_samples": 1999,
"eval_samples_per_second": 3.139,
"eval_steps_per_second": 0.393,
"train_loss": 133.9536453125,
"train_runtime": 2736.2059,
"train_samples": 10000,
"train_samples_per_second": 18.273,
"train_steps_per_second": 4.568
}