math_phi3_dpo_20_0 / all_results.json
lzc0525's picture
Upload folder using huggingface_hub
f625c53 verified
raw
history blame contribute delete
888 Bytes
{
"epoch": 0.9880609304240429,
"eval_logits/chosen": 9.158658981323242,
"eval_logits/rejected": 9.958081245422363,
"eval_logps/chosen": -110.41038513183594,
"eval_logps/ref_chosen": -106.16099548339844,
"eval_logps/ref_rejected": -119.78473663330078,
"eval_logps/rejected": -124.09846496582031,
"eval_loss": 0.6929683089256287,
"eval_rewards/accuracies": 0.4972222149372101,
"eval_rewards/chosen": -0.04249410331249237,
"eval_rewards/margins": 0.0006433044327422976,
"eval_rewards/rejected": -0.043137405067682266,
"eval_runtime": 159.1867,
"eval_samples": 1080,
"eval_samples_per_second": 6.784,
"eval_steps_per_second": 1.696,
"total_flos": 0.0,
"train_loss": 0.6922952850659688,
"train_runtime": 7631.3864,
"train_samples": 9715,
"train_samples_per_second": 1.273,
"train_steps_per_second": 0.01
}