{ "epoch": 1.0, "eval_logits/chosen": -0.8007283806800842, "eval_logits/rejected": -0.7758755683898926, "eval_logps/chosen": -1081.9208984375, "eval_logps/rejected": -1242.8665771484375, "eval_loss": 0.6785902976989746, "eval_rewards/accuracies": 0.6244725584983826, "eval_rewards/chosen": -0.003962064627557993, "eval_rewards/margins": 0.032243408262729645, "eval_rewards/rejected": -0.0362054705619812, "eval_runtime": 850.5886, "eval_samples": 7584, "eval_samples_per_second": 8.916, "eval_steps_per_second": 0.279 }