BertjeWDialDataALL03 / all_results.json
Jeska's picture
End of training
67cd60c
{
"epoch": 8.0,
"eval_loss": 1.9459083080291748,
"eval_runtime": 80.6558,
"eval_samples": 5193,
"eval_samples_per_second": 64.385,
"eval_steps_per_second": 8.059,
"perplexity": 6.999987112828894,
"train_loss": 2.0216803000285624,
"train_runtime": 46553.0134,
"train_samples": 98673,
"train_samples_per_second": 16.957,
"train_steps_per_second": 0.265
}