zephyr-7b-dpo-lora / all_results.json
diyali95916's picture
Model save
2567823 verified
raw
history blame
727 Bytes
{
"epoch": 4.0,
"eval_logits/chosen": -2.1724095344543457,
"eval_logits/rejected": -2.2160496711730957,
"eval_logps/chosen": -102.96302795410156,
"eval_logps/rejected": -101.06044006347656,
"eval_loss": 0.6873850226402283,
"eval_rewards/accuracies": 1.0,
"eval_rewards/chosen": 0.08033924549818039,
"eval_rewards/margins": 0.05054035410284996,
"eval_rewards/rejected": 0.02979888767004013,
"eval_runtime": 6.0716,
"eval_samples": 30,
"eval_samples_per_second": 4.941,
"eval_steps_per_second": 0.165,
"train_loss": 0.6922631859779358,
"train_runtime": 883.8621,
"train_samples": 626,
"train_samples_per_second": 3.541,
"train_steps_per_second": 0.006
}