minitron-4b-tulu-v2-mix / all_results.json
kykim0's picture
End of training
13d891d verified
raw
history blame
414 Bytes
{
"epoch": 0.008827099194527198,
"eval_loss": 1.1978037357330322,
"eval_runtime": 365.9654,
"eval_samples": 25000,
"eval_samples_per_second": 15.204,
"eval_steps_per_second": 3.801,
"total_flos": 6242130984960.0,
"train_loss": 1.322617530822754,
"train_runtime": 636.4506,
"train_samples": 326149,
"train_samples_per_second": 1.006,
"train_steps_per_second": 0.008
}