|
{ |
|
"epoch": 0.9995419147961521, |
|
"eval_logits/chosen": -0.6407761573791504, |
|
"eval_logits/rejected": -0.6567662358283997, |
|
"eval_logps/chosen": -200.93621826171875, |
|
"eval_logps/rejected": -276.8379821777344, |
|
"eval_loss": 0.30047258734703064, |
|
"eval_rewards/accuracies": 0.8699421882629395, |
|
"eval_rewards/chosen": 1.6737332344055176, |
|
"eval_rewards/margins": 2.166951894760132, |
|
"eval_rewards/rejected": -0.4932188391685486, |
|
"eval_runtime": 252.7931, |
|
"eval_samples": 2763, |
|
"eval_samples_per_second": 10.93, |
|
"eval_steps_per_second": 1.369 |
|
} |