distilled-mt5-small-0.6-1 / all_results.json
Lvxue's picture
End of training
abf975c
{
"epoch": 5.0,
"eval_bleu": 6.7165,
"eval_gen_len": 46.3377,
"eval_loss": 2.8345110416412354,
"eval_runtime": 694.5313,
"eval_samples": 1999,
"eval_samples_per_second": 2.878,
"eval_steps_per_second": 0.36,
"train_loss": 100.5107753125,
"train_runtime": 2803.7853,
"train_samples": 10000,
"train_samples_per_second": 17.833,
"train_steps_per_second": 4.458
}