qwen2.5-0.5b-expo-L2EXPO-ES-100 / eval_results.json
hZzy's picture
End of training
f06764c verified
raw
history blame
594 Bytes
{
"epoch": 2.9806329711856403,
"eval_dpo_loss": 245.87562561035156,
"eval_logits": -0.5435077548027039,
"eval_logps": -82.8267593383789,
"eval_loss": 486.1625671386719,
"eval_objective": 489.7927551269531,
"eval_ranking_idealized": 0.5212215185165405,
"eval_ranking_idealized_expo": 0.5212215185165405,
"eval_ranking_simple": 0.5253623127937317,
"eval_regularize": 489.7927551269531,
"eval_runtime": 308.4786,
"eval_samples": 5790,
"eval_samples_per_second": 18.77,
"eval_steps_per_second": 1.566,
"eval_wo_beta": 14.046432495117188
}