{ "epoch": 0.998691442030882, "eval_logits/chosen": -0.7125873565673828, "eval_logits/rejected": -0.7502822279930115, "eval_logps/chosen": -405.15185546875, "eval_logps/rejected": -435.5634460449219, "eval_loss": 0.5485080480575562, "eval_rewards/accuracies": 0.7379999756813049, "eval_rewards/chosen": -1.143401861190796, "eval_rewards/margins": 0.5365331768989563, "eval_rewards/rejected": -1.679935097694397, "eval_runtime": 355.0474, "eval_samples": 2000, "eval_samples_per_second": 5.633, "eval_steps_per_second": 1.408 }