math_phi3_dpo_100_60 / eval_results.json
lzc0525's picture
Upload folder using huggingface_hub
6560999 verified
raw
history blame contribute delete
729 Bytes
{
"epoch": 0.9880609304240429,
"eval_logits/chosen": 9.331795692443848,
"eval_logits/rejected": 10.156203269958496,
"eval_logps/chosen": -80.09001922607422,
"eval_logps/ref_chosen": -106.16099548339844,
"eval_logps/ref_rejected": -119.78473663330078,
"eval_logps/rejected": -93.58577728271484,
"eval_loss": 0.44601914286613464,
"eval_rewards/accuracies": 0.5018518567085266,
"eval_rewards/chosen": 0.2607097327709198,
"eval_rewards/margins": -0.001279854099266231,
"eval_rewards/rejected": 0.261989563703537,
"eval_runtime": 192.9589,
"eval_samples": 1080,
"eval_samples_per_second": 5.597,
"eval_sft_loss": 0.27996528148651123,
"eval_steps_per_second": 1.399
}