byt5-base-es_ngu / all_results.json
mekjr1's picture
End of training
d870ccc
raw
history blame
679 Bytes
{
"epoch": 10.0,
"eval_bleu": 0.0,
"eval_gen_len": 9.0,
"eval_loss": 0.734420120716095,
"eval_runtime": 14.2391,
"eval_samples": 793,
"eval_samples_per_second": 55.692,
"eval_steps_per_second": 3.511,
"predict_bleu": 0.0,
"predict_gen_len": 9.0,
"predict_loss": 0.7520648837089539,
"predict_runtime": 14.2551,
"predict_samples": 794,
"predict_samples_per_second": 55.699,
"predict_steps_per_second": 3.508,
"total_flos": 2212105531392000.0,
"train_loss": 1.0583241114388184,
"train_runtime": 517.4021,
"train_samples": 6345,
"train_samples_per_second": 122.632,
"train_steps_per_second": 7.673
}