distilled-mt5-small-b5 / all_results.json
Lvxue's picture
End of training
bb3294b
raw
history blame
414 Bytes
{
"epoch": 5.0,
"eval_bleu": 7.3798,
"eval_gen_len": 44.7109,
"eval_loss": 2.7944588661193848,
"eval_runtime": 569.4253,
"eval_samples": 1999,
"eval_samples_per_second": 3.511,
"eval_steps_per_second": 0.439,
"train_loss": 4.99171919921875,
"train_runtime": 2742.9735,
"train_samples": 10000,
"train_samples_per_second": 18.228,
"train_steps_per_second": 4.557
}