{ | |
"epoch": 2.983957219251337, | |
"eval_logits/chosen": -1.9690638780593872, | |
"eval_logits/rejected": -1.9223570823669434, | |
"eval_logps/chosen": -233.67343139648438, | |
"eval_logps/rejected": -227.1739044189453, | |
"eval_loss": 0.5413760542869568, | |
"eval_rewards/accuracies": 0.7767857313156128, | |
"eval_rewards/chosen": 0.5871802568435669, | |
"eval_rewards/margins": 2.1379942893981934, | |
"eval_rewards/rejected": -1.550813913345337, | |
"eval_runtime": 176.7918, | |
"eval_samples_per_second": 15.046, | |
"eval_steps_per_second": 0.238 | |
} |