phi-2-gpo-renew2-i0 / eval_results.json
BraylonDash's picture
Model save
2f18277 verified
raw
history blame
575 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": 0.937932550907135,
"eval_logits/rejected": 1.0401638746261597,
"eval_logps/chosen": -280.182861328125,
"eval_logps/rejected": -252.35885620117188,
"eval_loss": 0.034593481570482254,
"eval_rewards/accuracies": 0.6290000081062317,
"eval_rewards/chosen": -0.02636060118675232,
"eval_rewards/margins": 0.059068720787763596,
"eval_rewards/rejected": -0.08542931824922562,
"eval_runtime": 538.4763,
"eval_samples": 2000,
"eval_samples_per_second": 3.714,
"eval_steps_per_second": 0.929
}