{
  "epoch": 0.9981298423724285,
  "eval_logits/chosen": -1.1943395137786865,
  "eval_logits/rejected": -1.1611931324005127,
  "eval_logps/chosen": -1.2059502601623535,
  "eval_logps/rejected": -1.4740996360778809,
  "eval_loss": 1.373450517654419,
  "eval_rewards/accuracies": 0.6653226017951965,
  "eval_rewards/chosen": -3.0148754119873047,
  "eval_rewards/margins": 0.6703741550445557,
  "eval_rewards/rejected": -3.6852493286132812,
  "eval_runtime": 71.4975,
  "eval_samples": 1961,
  "eval_samples_per_second": 27.428,
  "eval_steps_per_second": 0.867
}