{
  "epoch": 2.0,
  "eval_logits/chosen": -2.3005340099334717,
  "eval_logits/rejected": -2.3817031383514404,
  "eval_logps/chosen": -316.1898498535156,
  "eval_logps/rejected": -322.1933898925781,
  "eval_loss": 0.4346597194671631,
  "eval_rewards/accuracies": 0.7658227682113647,
  "eval_rewards/chosen": -0.9460535049438477,
  "eval_rewards/margins": 1.8284220695495605,
  "eval_rewards/rejected": -2.7744758129119873,
  "eval_runtime": 117.6177,
  "eval_samples": 2500,
  "eval_samples_per_second": 21.255,
  "eval_steps_per_second": 0.672,
  "train_loss": 0.5184940074794384,
  "train_runtime": 19743.6623,
  "train_samples": 73494,
  "train_samples_per_second": 7.445,
  "train_steps_per_second": 0.058
}