chessgpt-medium-s / all_results.json
dakwi's picture
End of training
487c4d3 verified
{
"epoch": 0.99968,
"eval_loss": 1.097437858581543,
"eval_runtime": 230.0389,
"eval_samples": 12500,
"eval_samples_per_second": 54.339,
"eval_steps_per_second": 6.795,
"perplexity": 2.9964787778596422,
"total_flos": 6.457467788899123e+16,
"train_loss": 1.3367621437688184,
"train_runtime": 11215.3396,
"train_samples": 100000,
"train_samples_per_second": 8.916,
"train_steps_per_second": 0.139
}