math_phi3_dpo_100_100 / all_results.json
lzc0525's picture
Upload folder using huggingface_hub
82e400f verified
raw
history blame contribute delete
928 Bytes
{
"epoch": 0.9880609304240429,
"eval_logits/chosen": 9.246881484985352,
"eval_logits/rejected": 10.068053245544434,
"eval_logps/chosen": -74.92684936523438,
"eval_logps/ref_chosen": -106.16099548339844,
"eval_logps/ref_rejected": -119.78473663330078,
"eval_logps/rejected": -87.84820556640625,
"eval_loss": 0.26139113306999207,
"eval_rewards/accuracies": 0.47962963581085205,
"eval_rewards/chosen": 0.3123414218425751,
"eval_rewards/margins": -0.007023785263299942,
"eval_rewards/rejected": 0.3193652033805847,
"eval_runtime": 165.9841,
"eval_samples": 1080,
"eval_samples_per_second": 6.507,
"eval_sft_loss": 0.26139113306999207,
"eval_steps_per_second": 1.627,
"total_flos": 0.0,
"train_loss": 0.29937881012757617,
"train_runtime": 8120.0447,
"train_samples": 9715,
"train_samples_per_second": 1.196,
"train_steps_per_second": 0.009
}