math_llama3_reset_dpo_100_0_0.0 / eval_results.json
lzc0525's picture
Upload folder using huggingface_hub
da085a6 verified
raw
history blame contribute delete
698 Bytes
{
"epoch": 0.9182209469153515,
"eval_logits/chosen": -0.01766319014132023,
"eval_logits/rejected": 0.14318932592868805,
"eval_logps/chosen": -138.21542358398438,
"eval_logps/ref_chosen": -134.78414916992188,
"eval_logps/ref_rejected": -171.45664978027344,
"eval_logps/rejected": -174.8708953857422,
"eval_loss": 0.693236768245697,
"eval_rewards/accuracies": 0.47777777910232544,
"eval_rewards/chosen": -0.034312743693590164,
"eval_rewards/margins": -0.0001707002375042066,
"eval_rewards/rejected": -0.03414204344153404,
"eval_runtime": 143.4155,
"eval_samples": 1080,
"eval_samples_per_second": 7.531,
"eval_steps_per_second": 1.883
}