byt5-base-es_mim / all_results.json
mekjr1's picture
End of training
b973a65
{
"epoch": 10.0,
"eval_bleu": 8.1209,
"eval_gen_len": 100.8969,
"eval_loss": 0.5602744221687317,
"eval_runtime": 140.6184,
"eval_samples": 795,
"eval_samples_per_second": 5.654,
"eval_steps_per_second": 0.356,
"predict_bleu": 8.5941,
"predict_gen_len": 100.9183,
"predict_loss": 0.5462395548820496,
"predict_runtime": 139.8574,
"predict_samples": 796,
"predict_samples_per_second": 5.692,
"predict_steps_per_second": 0.358,
"total_flos": 2.26168179720192e+16,
"train_loss": 0.7384387069012053,
"train_runtime": 2101.0033,
"train_samples": 6360,
"train_samples_per_second": 30.271,
"train_steps_per_second": 1.894
}