zephyr-7b-dpo-lora / all_results.json
diyali95916's picture
Model save
edf51ed verified
raw
history blame contribute delete
722 Bytes
{
"epoch": 2.76,
"eval_logits/chosen": -2.274653911590576,
"eval_logits/rejected": -2.2999308109283447,
"eval_logps/chosen": -190.57220458984375,
"eval_logps/rejected": -132.8740234375,
"eval_loss": 0.68434077501297,
"eval_rewards/accuracies": 0.5,
"eval_rewards/chosen": 0.04404526203870773,
"eval_rewards/margins": 0.03693275526165962,
"eval_rewards/rejected": 0.0071125030517578125,
"eval_runtime": 6.6846,
"eval_samples": 30,
"eval_samples_per_second": 4.488,
"eval_steps_per_second": 0.15,
"train_loss": 0.6927925229072571,
"train_runtime": 943.7212,
"train_samples": 922,
"train_samples_per_second": 4.885,
"train_steps_per_second": 0.005
}