ruDialoGPT-medium / all_results.json
d.tsimerman
squash
cc2664b
{
"epoch": 1.0,
"eval_loss": 3.4997777938842773,
"eval_runtime": 448.829,
"eval_samples": 40311,
"eval_samples_per_second": 89.814,
"eval_steps_per_second": 7.486,
"perplexity": 33.10809432022858,
"train_loss": 3.4927627832876236,
"train_runtime": 361845.2402,
"train_samples": 8570756,
"train_samples_per_second": 23.686,
"train_steps_per_second": 1.974
}