jamba-900M-v0.13-KIx2 / all_results.json
pszemraj's picture
End of training
1058833 verified
raw
history blame
533 Bytes
{
"epoch": 1.997349589186324,
"eval_accuracy": 0.45143400679566215,
"eval_loss": 3.0366320610046387,
"eval_runtime": 36.3403,
"eval_samples": 300,
"eval_samples_per_second": 8.255,
"eval_steps_per_second": 2.064,
"num_input_tokens_seen": 1975517184,
"perplexity": 20.83495408242377,
"total_flos": 9.732316690586272e+18,
"train_loss": 3.186332613039928,
"train_runtime": 34789.3198,
"train_samples": 60368,
"train_samples_per_second": 3.47,
"train_steps_per_second": 0.027
}