{ "epoch": 2.0, "eval_logits/chosen": 0.7325530052185059, "eval_logits/rejected": 0.7531598806381226, "eval_logps/chosen": -94.8434829711914, "eval_logps/rejected": -98.55415344238281, "eval_loss": 0.687246561050415, "eval_rewards/accuracies": 0.33399999141693115, "eval_rewards/chosen": -0.03116113506257534, "eval_rewards/margins": 0.012410260736942291, "eval_rewards/rejected": -0.04357139766216278, "eval_runtime": 272.5724, "eval_samples": 2000, "eval_samples_per_second": 7.337, "eval_steps_per_second": 0.459 }