|
{ |
|
"epoch": 0.9880609304240429, |
|
"eval_logits/chosen": 9.28704833984375, |
|
"eval_logits/rejected": 10.111818313598633, |
|
"eval_logps/chosen": -77.38970184326172, |
|
"eval_logps/ref_chosen": -106.16099548339844, |
|
"eval_logps/ref_rejected": -119.78473663330078, |
|
"eval_logps/rejected": -90.60062408447266, |
|
"eval_loss": 0.3555455803871155, |
|
"eval_rewards/accuracies": 0.4879629611968994, |
|
"eval_rewards/chosen": 0.2877129316329956, |
|
"eval_rewards/margins": -0.004128198605030775, |
|
"eval_rewards/rejected": 0.2918411195278168, |
|
"eval_runtime": 199.7246, |
|
"eval_samples": 1080, |
|
"eval_samples_per_second": 5.407, |
|
"eval_sft_loss": 0.2702542543411255, |
|
"eval_steps_per_second": 1.352 |
|
} |