| { | |
| "epoch": 0.998691442030882, | |
| "eval_logits/chosen": -0.8399364352226257, | |
| "eval_logits/rejected": -0.8775278329849243, | |
| "eval_logps/chosen": -316.6497802734375, | |
| "eval_logps/rejected": -344.29437255859375, | |
| "eval_loss": 0.5597857236862183, | |
| "eval_rewards/accuracies": 0.7239999771118164, | |
| "eval_rewards/chosen": -0.25838080048561096, | |
| "eval_rewards/margins": 0.5088632106781006, | |
| "eval_rewards/rejected": -0.7672439813613892, | |
| "eval_runtime": 355.4568, | |
| "eval_samples": 2000, | |
| "eval_samples_per_second": 5.627, | |
| "eval_steps_per_second": 1.407 | |
| } |