{
  "epoch": 0.9999183606825047,
  "eval_logits/chosen": -0.67052161693573,
  "eval_logits/rejected": -0.61020427942276,
  "eval_logps/chosen": -990.1327514648438,
  "eval_logps/rejected": -1154.4678955078125,
  "eval_loss": 0.38660529255867004,
  "eval_rewards/accuracies": 0.8059999942779541,
  "eval_rewards/chosen": -5.162255764007568,
  "eval_rewards/margins": 1.7307368516921997,
  "eval_rewards/rejected": -6.89299201965332,
  "eval_runtime": 614.9178,
  "eval_samples": 4000,
  "eval_samples_per_second": 6.505,
  "eval_steps_per_second": 0.407
}