distilled-mt5-small-0.05-1 / all_results.json
Lvxue's picture
End of training
898199c
{
"epoch": 5.0,
"eval_bleu": 6.997,
"eval_gen_len": 46.2551,
"eval_loss": 2.810580015182495,
"eval_runtime": 620.2548,
"eval_samples": 1999,
"eval_samples_per_second": 3.223,
"eval_steps_per_second": 0.403,
"train_loss": 11.335328515625,
"train_runtime": 2800.5936,
"train_samples": 10000,
"train_samples_per_second": 17.853,
"train_steps_per_second": 4.463
}