starchat2-15b-v0.1 / all_results.json
lewtun's picture
lewtun HF staff
Add HuggingFaceH4/starcoder2-15b-dpo-v4.0 checkpoint
3dcc536 verified
raw
history blame
748 Bytes
{
"epoch": 2.0,
"eval_logits/chosen": -2.3005340099334717,
"eval_logits/rejected": -2.3817031383514404,
"eval_logps/chosen": -316.1898498535156,
"eval_logps/rejected": -322.1933898925781,
"eval_loss": 0.4346597194671631,
"eval_rewards/accuracies": 0.7658227682113647,
"eval_rewards/chosen": -0.9460535049438477,
"eval_rewards/margins": 1.8284220695495605,
"eval_rewards/rejected": -2.7744758129119873,
"eval_runtime": 117.6177,
"eval_samples": 2500,
"eval_samples_per_second": 21.255,
"eval_steps_per_second": 0.672,
"train_loss": 0.5184940074794384,
"train_runtime": 19743.6623,
"train_samples": 73494,
"train_samples_per_second": 7.445,
"train_steps_per_second": 0.058
}