BertjeWDialDataALLQonly / all_results.json
Jeska's picture
End of training
7473103
{
"epoch": 15.0,
"eval_loss": 1.9438238143920898,
"eval_runtime": 45.4177,
"eval_samples": 2933,
"eval_samples_per_second": 64.578,
"eval_steps_per_second": 8.081,
"perplexity": 6.985410881541159,
"train_loss": 1.9284902631757455,
"train_runtime": 49525.3053,
"train_samples": 55736,
"train_samples_per_second": 16.881,
"train_steps_per_second": 0.264
}