zephyr-7b / eval_results.json
jikaixuan's picture
End of training
bdfa771 verified
raw
history blame
655 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": -0.24525223672389984,
"eval_logits/rejected": -0.1380803883075714,
"eval_logps/chosen": -103.02954864501953,
"eval_logps/rejected": -131.91891479492188,
"eval_loss": 0.6906174421310425,
"eval_pred_label": 4192.14306640625,
"eval_rewards/accuracies": 0.363095223903656,
"eval_rewards/chosen": -0.3412899374961853,
"eval_rewards/margins": 0.22391849756240845,
"eval_rewards/rejected": -0.5652084350585938,
"eval_runtime": 247.5585,
"eval_samples": 2000,
"eval_samples_per_second": 8.079,
"eval_steps_per_second": 0.254,
"eval_use_label": 15879.857421875
}