|
{ |
|
"epoch": 0.9880609304240429, |
|
"eval_logits/chosen": 9.35390567779541, |
|
"eval_logits/rejected": 10.18101692199707, |
|
"eval_logps/chosen": -0.37907084822654724, |
|
"eval_logps/rejected": -0.3889653980731964, |
|
"eval_loss": 1.382422924041748, |
|
"eval_rewards/accuracies": 0.5287036895751953, |
|
"eval_rewards/chosen": -0.7581416964530945, |
|
"eval_rewards/margins": 0.019789105281233788, |
|
"eval_rewards/rejected": -0.7779307961463928, |
|
"eval_runtime": 152.7821, |
|
"eval_samples": 1080, |
|
"eval_samples_per_second": 7.069, |
|
"eval_steps_per_second": 1.767, |
|
"total_flos": 0.0, |
|
"train_loss": 1.3895690520604451, |
|
"train_runtime": 7857.9562, |
|
"train_samples": 9715, |
|
"train_samples_per_second": 1.236, |
|
"train_steps_per_second": 0.01 |
|
} |